<86>Sep 7 00:01:47 userdel[4081645]: delete user 'rooter' <86>Sep 7 00:01:47 userdel[4081645]: removed group 'rooter' owned by 'rooter' <86>Sep 7 00:01:47 userdel[4081645]: removed shadow group 'rooter' owned by 'rooter' <86>Sep 7 00:01:47 groupadd[4081652]: group added to /etc/group: name=rooter, GID=1211 <86>Sep 7 00:01:47 groupadd[4081652]: group added to /etc/gshadow: name=rooter <86>Sep 7 00:01:47 groupadd[4081652]: new group: name=rooter, GID=1211 <86>Sep 7 00:01:47 useradd[4081658]: new user: name=rooter, UID=1211, GID=1211, home=/root, shell=/bin/bash, from=none <86>Sep 7 00:01:47 userdel[4081668]: delete user 'builder' <86>Sep 7 00:01:47 userdel[4081668]: removed group 'builder' owned by 'builder' <86>Sep 7 00:01:47 userdel[4081668]: removed shadow group 'builder' owned by 'builder' <86>Sep 7 00:01:47 groupadd[4081675]: group added to /etc/group: name=builder, GID=1212 <86>Sep 7 00:01:47 groupadd[4081675]: group added to /etc/gshadow: name=builder <86>Sep 7 00:01:47 groupadd[4081675]: new group: name=builder, GID=1212 <86>Sep 7 00:01:47 useradd[4081681]: new user: name=builder, UID=1212, GID=1212, home=/usr/src, shell=/bin/bash, from=none /usr/src/in/srpm/rccl-2.18.6-alt0.1.src.rpm: bad symbols in the license tag: // <13>Sep 7 00:01:57 rpmi: libidn2-2.3.7-alt1 sisyphus+339505.100.1.2 1706718968 installed <13>Sep 7 00:01:57 rpmi: libnettle8-3.9.1-alt1 sisyphus+322548.100.1.2 1686176879 installed <13>Sep 7 00:01:57 rpmi: libp11-kit-1:0.25.5-alt1 sisyphus+352553.100.1.1 1720622573 installed <13>Sep 7 00:01:57 rpmi: libtasn1-4.19.0-alt3 sisyphus+327816.100.1.1 1692802615 installed <13>Sep 7 00:01:57 rpmi: libhogweed6-3.9.1-alt1 sisyphus+322548.100.1.2 1686176879 installed <13>Sep 7 00:01:57 rpmi: libgnutls30-3.8.4-alt1 sisyphus+343729.100.2.1 1711571288 installed <13>Sep 7 00:01:57 rpmi: libngtcp2.16-1.7.0-alt1 sisyphus+356415.200.1.1 1725031912 installed <13>Sep 7 00:01:57 rpmi: libngtcp2_crypto_gnutls8-1.7.0-alt1 sisyphus+356415.200.1.1 1725031912 installed <13>Sep 7 00:01:57 rpmi: cmake-modules-3.29.3-alt1 sisyphus+348648.100.2.1 1716590540 installed <13>Sep 7 00:01:57 rpmi: libuv-1.48.0-alt1 sisyphus+340945.100.1.1 1708265066 installed <13>Sep 7 00:01:57 rpmi: librhash-1.3.5-alt3 sisyphus+286141.40.2.1 1632982456 installed <13>Sep 7 00:01:57 rpmi: libjsoncpp24-1.9.4-alt2 sisyphus+346331.200.2.1 1716448551 installed <13>Sep 7 00:01:57 rpmi: libexpat-2.5.0-alt1 sisyphus+346180.200.2.1 1716349835 installed <13>Sep 7 00:01:57 rpmi: publicsuffix-list-dafsa-20240701-alt1 sisyphus+352081.100.1.1 1720015477 installed <13>Sep 7 00:01:57 rpmi: libpsl-0.21.5-alt1 sisyphus+338474.100.1.1 1705684769 installed <13>Sep 7 00:01:57 rpmi: libnghttp3.9-1.5.0-alt1 sisyphus+356415.100.1.1 1725031855 installed <13>Sep 7 00:01:57 rpmi: libnghttp2-1.63.0-alt1 sisyphus+356414.100.1.1 1725031508 installed <13>Sep 7 00:01:57 rpmi: openldap-common-2.6.8-alt1 sisyphus+351621.100.1.1 1719420449 installed <13>Sep 7 00:01:57 rpmi: libntlm-1.5-alt1 sisyphus+278100.3300.1.1 1626058899 installed <13>Sep 7 00:01:57 rpmi: libidn-1.37-alt2 sisyphus+300849.100.1.1 1653769687 installed <13>Sep 7 00:01:57 rpmi: libverto-0.3.2-alt1_1 sisyphus+321176.2200.10.2 1684803947 installed <13>Sep 7 00:01:57 rpmi: liblmdb-0.9.32-alt1 sisyphus+342426.100.1.1 1710124288 installed <13>Sep 7 00:01:57 rpmi: libkeyutils-1.6.3-alt1 sisyphus+346336.200.2.2 1716472658 installed <13>Sep 7 00:01:57 rpmi: libcom_err-1.46.4.0.5.4cda-alt1 sisyphus+283826.100.1.1 1629975345 installed <13>Sep 7 00:01:57 rpmi: libbrotlicommon-1.1.0-alt1 sisyphus+328501.100.1.1 1693598419 installed <13>Sep 7 00:01:57 rpmi: libbrotlidec-1.1.0-alt1 sisyphus+328501.100.1.1 1693598419 installed <13>Sep 7 00:01:57 rpmi: rpm-macros-cmake-3.29.1-alt1 sisyphus+344518.300.3.1 1712379787 installed <13>Sep 7 00:01:57 rpmi: rpm-macros-alternatives-0.5.2-alt2 sisyphus+315270.200.2.1 1676457367 installed <13>Sep 7 00:01:57 rpmi: alternatives-0.5.2-alt2 sisyphus+315270.200.2.1 1676457367 installed <13>Sep 7 00:01:57 rpmi: ca-certificates-2024.07.01-alt1 sisyphus+351897.100.1.1 1719826350 installed <13>Sep 7 00:01:57 rpmi: ca-trust-0.2.0-alt1 sisyphus+344843.100.1.1 1712743326 installed <13>Sep 7 00:01:57 rpmi: p11-kit-trust-1:0.25.5-alt1 sisyphus+352553.100.1.1 1720622573 installed <13>Sep 7 00:01:57 rpmi: libcrypto3-3.1.7-alt1 sisyphus+356755.100.1.1 1725388416 installed <13>Sep 7 00:01:57 rpmi: libssl3-3.1.7-alt1 sisyphus+356755.100.1.1 1725388416 installed <86>Sep 7 00:01:57 groupadd[4084553]: group added to /etc/group: name=_keytab, GID=999 <86>Sep 7 00:01:57 groupadd[4084553]: group added to /etc/gshadow: name=_keytab <86>Sep 7 00:01:57 groupadd[4084553]: new group: name=_keytab, GID=999 <13>Sep 7 00:01:57 rpmi: libkrb5-1.21.3-alt2 sisyphus+351857.100.1.1 1719735141 installed <13>Sep 7 00:01:57 rpmi: libgsasl-2.2.0-alt1 sisyphus+333173.100.1.1 1698696954 installed <86>Sep 7 00:01:57 groupadd[4084667]: group added to /etc/group: name=sasl, GID=998 <86>Sep 7 00:01:57 groupadd[4084667]: group added to /etc/gshadow: name=sasl <86>Sep 7 00:01:57 groupadd[4084667]: new group: name=sasl, GID=998 <13>Sep 7 00:01:57 rpmi: libsasl2-3-2.1.28-alt2 sisyphus+343335.100.1.1 1711112544 installed <13>Sep 7 00:01:57 rpmi: libldap2-2.6.8-alt1 sisyphus+351621.100.1.1 1719420449 installed <13>Sep 7 00:01:57 rpmi: libarchive13-3.6.1-alt2 sisyphus+324359.1300.6.1 1689326379 installed <13>Sep 7 00:01:57 rpmi: libssh2-1.11.0-alt2 sisyphus+339356.100.1.1 1706593137 installed <13>Sep 7 00:01:57 rpmi: libcurl-8.9.1-alt1 sisyphus+353987.100.1.1 1722417670 installed <13>Sep 7 00:01:58 rpmi: cmake-3.29.3-alt1 sisyphus+348648.100.2.1 1716590540 installed <13>Sep 7 00:02:51 rpmi: llvm-common-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:02:51 rpmi: llvm-rocm-filesystem-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:02:51 rpmi: libnuma-2.0.14-alt2 sisyphus+278485.100.1.1 1626104244 installed <13>Sep 7 00:02:51 rpmi: rocm-device-libs-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:02:51 rpmi: llvm18.1-filesystem-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:02:52 rpmi: clang18.1-support-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:02:52 rpmi: llvm18.1-polly-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:02:52 rpmi: gcc-c++-common-1.4.28-alt1 sisyphus+348678.100.1.1 1716396142 installed <13>Sep 7 00:02:52 rpmi: libstdc++13-devel-13.2.1-alt4 sisyphus+354645.100.1.1 1723060849 installed <13>Sep 7 00:02:52 rpmi: librocm-smi1-6.1.2-alt0.2 sisyphus+352428.100.1.1 1720459745 installed <13>Sep 7 00:02:52 rpmi: libpciaccess-1:0.18.1-alt1 sisyphus+343583.300.1.1 1711440789 installed <13>Sep 7 00:02:52 rpmi: libdrm-1:2.4.122-alt1 sisyphus+352241.100.1.1 1720177129 installed <13>Sep 7 00:02:52 rpmi: libhsakmt1-6.1.2-alt0.1 sisyphus+352247.600.5.1 1720254766 installed <13>Sep 7 00:02:52 rpmi: libhsa-runtime1-6.1.2-alt0.1 sisyphus+352247.1600.9.1 1720269840 installed <13>Sep 7 00:02:52 rpmi: libpci-3.13.0-alt1 sisyphus+350694.100.1.1 1717993339 installed <13>Sep 7 00:02:52 rpmi: pciids-20240627-alt1 sisyphus+351710.100.1.1 1719555191 installed <13>Sep 7 00:02:52 rpmi: pciutils-3.13.0-alt1 sisyphus+350694.100.1.1 1717993339 installed <13>Sep 7 00:02:52 rpmi: libmpdec3-2.5.1-alt3 sisyphus+314490.500.5.1 1675432004 installed <13>Sep 7 00:02:52 rpmi: libgdbm-1.8.3-alt10 sisyphus+346222.200.3.2 1716468404 installed <13>Sep 7 00:02:52 rpmi: libb2-0.98.1-alt1_1 sisyphus+291614.100.1.1 1638962877 installed <13>Sep 7 00:02:53 rpmi: python3-3.12.5-alt1 sisyphus+355289.200.2.1 1723833848 installed <13>Sep 7 00:02:53 rpmi: python3-base-3.12.5-alt1 sisyphus+355289.200.2.1 1723833848 installed <13>Sep 7 00:02:54 rpmi: clang-rocm-libs-support-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:02:58 rpmi: clang-rocm-libs-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:02:58 rpmi: rocminfo-6.1.2-alt0.1 sisyphus+352247.1700.9.1 1720269882 installed <13>Sep 7 00:02:58 rpmi: libedit3-3.1.20230828-alt1 sisyphus+330914.200.3.1 1696922743 installed <13>Sep 7 00:02:58 rpmi: llvm18.1-gold-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:00 rpmi: llvm18.1-libs-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:01 rpmi: libclang-cpp18-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:01 rpmi: clang18.1-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:01 rpmi: clang-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:03:03 rpmi: clang-rocm-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:05 rpmi: llvm18.1-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:05 rpmi: llvm-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:03:24 rpmi: llvm-rocm-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:25 rpmi: libclang18-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:25 rpmi: clang18.1-devel-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:25 rpmi: clang-devel-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:03:26 rpmi: clang18.1-tools-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:26 rpmi: clang-tools-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:03:36 rpmi: clang-rocm-tools-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:37 rpmi: lld18.1-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:03:37 rpmi: lld-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:03:38 rpmi: lld-rocm-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:40 rpmi: libamd_comgr2-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:41 rpmi: llvm-rocm-gold-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:43 rpmi: llvm-rocm-libs-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:43 rpmi: hip-runtime-amd-6.1.2-alt0.2 sisyphus+352364.100.1.1 1720383820 installed <13>Sep 7 00:03:43 rpmi: hipcc-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:03:47 rpmi: mlir18.1-tools-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:04:14 rpmi: llvm18.1-devel-18.1.8-alt0.1 sisyphus+351511.100.1.1 1719305993 installed <13>Sep 7 00:04:14 rpmi: llvm-devel-18.1.0-alt1 sisyphus+343963.100.6.1 1713343158 installed <13>Sep 7 00:04:33 rpmi: llvm-rocm-devel-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:04:33 rpmi: hip-devel-6.1.2-alt0.2 sisyphus+352364.100.1.1 1720383820 installed <13>Sep 7 00:04:33 rpmi: rocm-comgr-devel-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:04:48 rpmi: clang-rocm-devel-6.1.2-alt0.2 sisyphus+352528.100.1.1 1720604563 installed <13>Sep 7 00:04:49 rpmi: hipify-clang-6.1.2-alt0.1 sisyphus+352428.200.1.1 1720459887 installed <13>Sep 7 00:04:49 rpmi: hsa-rocr-devel-6.1.2-alt0.1 sisyphus+352247.1600.9.1 1720269840 installed <13>Sep 7 00:04:49 rpmi: librocm-smi-devel-6.1.2-alt0.2 sisyphus+352428.100.1.1 1720459745 installed <13>Sep 7 00:04:49 rpmi: libstdc++-devel-13-alt1 sisyphus+323337.300.1.1 1687267966 installed <13>Sep 7 00:04:49 rpmi: rocm-cmake-6.1.2-alt0.1 sisyphus+352247.100.1.1 1720180839 installed Building target platforms: x86_64 Building for target x86_64 Wrote: /usr/src/in/nosrpm/rccl-2.18.6-alt0.1.nosrc.rpm (w1.gzdio) Installing rccl-2.18.6-alt0.1.src.rpm Building target platforms: x86_64 Building for target x86_64 Executing(%prep): /bin/sh -e /usr/src/tmp/rpm-tmp.8122 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + rm -rf rccl-2.18.6 + echo 'Source #0 (rccl-2.18.6.tar):' Source #0 (rccl-2.18.6.tar): + /bin/tar -xf /usr/src/RPM/SOURCES/rccl-2.18.6.tar + cd rccl-2.18.6 + /bin/chmod -c -Rf u+rwX,go-w . + subst 's,cat ${ROCM_PATH}/.info/version,echo 6.1.2,' CMakeLists.txt + exit 0 Executing(%build): /bin/sh -e /usr/src/tmp/rpm-tmp.93728 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd rccl-2.18.6 + export ALTWRAP_LLVM_VERSION=rocm + ALTWRAP_LLVM_VERSION=rocm + mkdir -p x86_64-alt-linux + cmake -DCMAKE_SKIP_INSTALL_RPATH:BOOL=yes '-DCMAKE_C_FLAGS:STRING=-pipe -frecord-gcc-switches -Wall -g -O2 ' '-DCMAKE_CXX_FLAGS:STRING=-pipe -frecord-gcc-switches -Wall -g -O2 ' '-DCMAKE_Fortran_FLAGS:STRING=-pipe -frecord-gcc-switches -Wall -g -O2 ' -DCMAKE_INSTALL_PREFIX=/usr -DINCLUDE_INSTALL_DIR:PATH=/usr/include -DLIB_INSTALL_DIR:PATH=/usr/lib64 -DSYSCONF_INSTALL_DIR:PATH=/etc -DSHARE_INSTALL_PREFIX:PATH=/usr/share -DLIB_DESTINATION=lib64 -DLIB_SUFFIX=64 -S . -B x86_64-alt-linux -Wno-dev -DROCM_PATH=/usr -DCMAKE_C_COMPILER=clang -DCMAKE_CXX_COMPILER=clang++ -DCMAKE_INSTALL_LIBDIR=lib64 -DENABLE_MSCCL_KERNEL=ON -- The CXX compiler identification is Clang 17.0.0 -- Detecting CXX compiler ABI info -- Detecting CXX compiler ABI info - done -- Check for working CXX compiler: /usr/bin/clang++ - skipped -- Detecting CXX compile features -- Detecting CXX compile features - done -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- Checking for ROCm support for GPU targets: -- Performing Test COMPILER_HAS_TARGET_ID_gfx803 -- Performing Test COMPILER_HAS_TARGET_ID_gfx803 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx900_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx900_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx906_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx906_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx908_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx908_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_on -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_on - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx940 -- Performing Test COMPILER_HAS_TARGET_ID_gfx940 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx941 -- Performing Test COMPILER_HAS_TARGET_ID_gfx941 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx942 -- Performing Test COMPILER_HAS_TARGET_ID_gfx942 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1030 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1030 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1101 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1101 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx1102 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1102 - Success -- Compiling for gfx803;gfx900:xnack-;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack-;gfx90a:xnack+;gfx940;gfx941;gfx942;gfx1030;gfx1100;gfx1101;gfx1102 -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- ROCM_PATH found: /usr -- Performing Test CMAKE_HAVE_LIBC_PTHREAD -- Performing Test CMAKE_HAVE_LIBC_PTHREAD - Success -- Found Threads: TRUE -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS - Success -- HIP compiler: clang -- HIP runtime: rocclr -- hipcc executable: /usr/bin/hipcc -- hipcc version: 6.1.40093 -- ROCm version: 6.1.2 ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-pipe -frecord-gcc-switches -Wall -g -O2"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /usr/src/RPM/BUILD/rccl-2.18.6/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:79 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:69 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:145 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-pipe -frecord-gcc-switches -Wall -g -O2"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /usr/src/RPM/BUILD/rccl-2.18.6/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:80 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:69 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:145 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipEventDisableSystemFence -- Looking for hipEventDisableSystemFence - not found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-pipe -frecord-gcc-switches -Wall -g -O2"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /usr/src/RPM/BUILD/rccl-2.18.6/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:84 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:145 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-pipe -frecord-gcc-switches -Wall -g -O2"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /usr/src/RPM/BUILD/rccl-2.18.6/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:79 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:69 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:148 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-pipe -frecord-gcc-switches -Wall -g -O2"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /usr/src/RPM/BUILD/rccl-2.18.6/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:80 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:69 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:148 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocUncached -- Looking for hipDeviceMallocUncached - not found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-pipe -frecord-gcc-switches -Wall -g -O2"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /usr/src/RPM/BUILD/rccl-2.18.6/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:84 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:148 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- HSA runtime: /usr/include -- Found rocm_smi at /usr/include -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h - found -- Performing Test HAVE_KERNARG_PRELOAD -- Performing Test HAVE_KERNARG_PRELOAD - Success -- Kernarg preloading to SGPR enabled -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/device_table.h -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/device_table.cpp -- Generating /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/host_table.cpp -- HIP_UNCACHED_MEMORY enabled -- RCCL LL128 protocol enabled -- Building shared RCCL library -- rocm-cmake: Set license file to /usr/src/RPM/BUILD/rccl-2.18.6/LICENSE.txt. -- Configuring done (24.6s) -- Generating done (0.0s) CMake Warning: Manually-specified variables were not used by the project: CMAKE_C_COMPILER CMAKE_C_FLAGS CMAKE_Fortran_FLAGS LIB_DESTINATION LIB_SUFFIX SHARE_INSTALL_PREFIX SYSCONF_INSTALL_DIR -- Build files have been written to: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux + cmake --build x86_64-alt-linux --verbose --parallel 8 Change Dir: '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' Run Build Command(s): /usr/bin/cmake -E env VERBOSE=1 /usr/bin/gmake -f Makefile -j8 gmake: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/cmake -S/usr/src/RPM/BUILD/rccl-2.18.6 -B/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux --check-build-system CMakeFiles/Makefile.cmake 0 gmake: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/cmake -E cmake_progress_start /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/CMakeFiles /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux//CMakeFiles/progress.marks gmake: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/gmake -f CMakeFiles/Makefile2 all /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/depend gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' cd /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /usr/src/RPM/BUILD/rccl-2.18.6 /usr/src/RPM/BUILD/rccl-2.18.6 /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/CMakeFiles/git_version_check.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/build gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 0%] Updating git_version.cpp if necessary /usr/bin/cmake -P /usr/src/RPM/BUILD/rccl-2.18.6/cmake/git_version.cmake -- Updating git_version.cpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[1]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 0%] Built target git_version_check gmake[1]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/depend gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 0%] Hipifying src/collectives/all_reduce.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/all_reduce.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 1%] Hipifying src/collectives/all_to_all.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/all_to_all.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 1%] Hipifying src/collectives/all_to_allv.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/all_to_allv.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 0%] Hipifying src/channel.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/channel.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 0%] Hipifying src/transport/shm.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/shm.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 0%] Hipifying src/bootstrap.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/bootstrap.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 1%] Hipifying src/collectives/all_gather.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/all_gather.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 2%] Hipifying src/collectives/broadcast.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/broadcast.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 3%] Hipifying src/collectives/device/alltoall_pivot.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/alltoall_pivot.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 3%] Hipifying src/collectives/device/broadcast.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/broadcast.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 2%] Hipifying src/collectives/device/all_gather.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/all_gather.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 4%] Hipifying src/collectives/device/common_kernel.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common_kernel.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/common_kernel.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common_kernel.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 2%] Hipifying src/collectives/device/all_reduce.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/all_reduce.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 4%] Hipifying src/collectives/device/onerank_reduce.cu -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/onerank_reduce.cu.cpp mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/onerank_reduce.cu -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/onerank_reduce.cu.cpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 4%] Hipifying src/collectives/device/msccl_kernel_impl.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/msccl_kernel_impl.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 3%] Hipifying src/collectives/device/common.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/common.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 4%] Hipifying src/collectives/device/primitives.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/primitives.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 4%] Hipifying src/collectives/device/op128.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/op128.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/op128.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/op128.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 5%] Hipifying src/collectives/device/prims_ll.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/prims_ll.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 5%] Hipifying src/collectives/device/prims_ll128.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/prims_ll128.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 5%] Hipifying src/collectives/device/prims_simple.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/prims_simple.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 6%] Hipifying src/collectives/device/sendrecv.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/sendrecv.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 6%] Hipifying src/collectives/device/reduce_scatter.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/reduce_scatter.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 5%] Hipifying src/collectives/device/reduce_kernel.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_kernel.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/reduce_kernel.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_kernel.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 5%] Hipifying src/collectives/device/reduce.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/device/reduce.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 6%] Hipifying src/collectives/gather.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/gather.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 6%] Hipifying src/collectives/msccl.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/msccl.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 7%] Hipifying src/collectives/reduce_scatter.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/reduce_scatter.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 7%] Hipifying src/collectives/reduce.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/reduce.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 7%] Hipifying src/collectives/scatter.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/scatter.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 8%] Hipifying src/collectives/sendrecv.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/collectives/sendrecv.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 8%] Hipifying src/debug.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/debug.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 8%] Hipifying src/graph/connect.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/connect.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 9%] Hipifying src/graph/rings.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/rings.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 9%] Hipifying src/graph/paths.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/paths.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 9%] Hipifying src/graph/rings.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/rings.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 10%] Hipifying src/graph/rome_models.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/rome_models.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 8%] Hipifying src/enqueue.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/enqueue.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 9%] Hipifying src/graph/rome_models.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/rome_models.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 10%] Hipifying src/graph/search.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/search.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 10%] Hipifying src/graph/topo.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/topo.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 11%] Hipifying src/graph/trees.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/trees.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/trees.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/trees.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 10%] Hipifying src/graph/topo.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/topo.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 11%] Hipifying src/graph/tuning.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/tuning.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 12%] Hipifying src/graph/xml.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/xml.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 12%] Hipifying src/group.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/group.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 12%] Hipifying src/graph/xml.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/graph/xml.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 12%] Hipifying src/include/BfdBacktrace.hpp -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/BfdBacktrace.hpp mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/BfdBacktrace.hpp -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/BfdBacktrace.hpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 12%] Hipifying src/include/align.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/align.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/align.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/align.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 13%] Hipifying src/include/alloc.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/alloc.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 13%] Hipifying src/include/archinfo.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/archinfo.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/archinfo.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/archinfo.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 13%] Hipifying src/include/bootstrap.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/bootstrap.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/bootstrap.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/bootstrap.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 14%] Hipifying src/include/channel.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/channel.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 13%] Hipifying src/include/argcheck.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/argcheck.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 14%] Hipifying src/include/checks.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/checks.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 14%] Hipifying src/include/coll_net.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/coll_net.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 15%] Hipifying src/include/comm.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/comm.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 15%] Hipifying src/include/core.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/core.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 15%] Hipifying src/include/collectives.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/collectives.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/collectives.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/collectives.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 16%] Hipifying src/include/debug.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/debug.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/debug.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/debug.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 15%] Hipifying src/include/cpuset.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/cpuset.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/cpuset.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/cpuset.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 16%] Hipifying src/include/enqueue.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/enqueue.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 16%] Hipifying src/include/devcomm.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/devcomm.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/devcomm.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/devcomm.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 17%] Hipifying src/include/git_version.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/git_version.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/git_version.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/git_version.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 17%] Hipifying src/include/graph.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/graph.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 16%] Hipifying src/include/gdrwrap.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/gdrwrap.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 18%] Hipifying src/include/ibvsymbols.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvsymbols.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/ibvsymbols.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvsymbols.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 17%] Hipifying src/include/group.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/group.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 18%] Hipifying src/include/info.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/info.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 17%] Hipifying src/include/ibvcore.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvcore.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/ibvcore.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvcore.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 18%] Hipifying src/include/ibvwrap.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/ibvwrap.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 18%] Hipifying src/include/ipcsocket.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ipcsocket.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/ipcsocket.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ipcsocket.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 19%] Hipifying src/include/msccl/msccl_lifecycle.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_lifecycle.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_lifecycle.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_lifecycle.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 19%] Hipifying src/include/msccl/msccl_parser.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_parser.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 18%] Hipifying src/include/msccl/msccl_kernel.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_kernel.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_kernel.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_kernel.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 19%] Hipifying src/include/msccl/msccl_scheduler.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_scheduler.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_scheduler.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_scheduler.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 20%] Hipifying src/include/msccl/msccl_setup.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_setup.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_setup.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_setup.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 20%] Hipifying src/include/msccl/msccl_struct.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_struct.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_struct.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_struct.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 20%] Hipifying src/include/msccl/msccl_status.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_status.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/msccl/msccl_status.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_status.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 21%] Hipifying src/include/net.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/net.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 21%] Hipifying src/include/npkit/npkit_struct.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit/npkit_struct.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/npkit/npkit_struct.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit/npkit_struct.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 20%] Hipifying src/include/nccl_net.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nccl_net.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nccl_net.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nccl_net.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 21%] Hipifying src/include/npkit/npkit.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit/npkit.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/npkit/npkit.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit/npkit.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 21%] Hipifying src/include/npkit/npkit_event.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit/npkit_event.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/npkit/npkit_event.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/npkit/npkit_event.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 22%] Hipifying src/include/nvmlwrap.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvmlwrap.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvmlwrap.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvmlwrap.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 22%] Hipifying src/include/nvtx3/nvToolsExtCuda.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtCuda.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvToolsExtCuda.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtCuda.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 22%] Hipifying src/include/nvtx.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 22%] Hipifying src/include/nvtx3/nvToolsExt.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExt.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvToolsExt.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExt.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 22%] Hipifying src/include/nvtx3/nvToolsExtCudaRt.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtCudaRt.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvToolsExtCudaRt.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtCudaRt.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 23%] Hipifying src/include/nvtx3/nvToolsExtOpenCL.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtOpenCL.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvToolsExtOpenCL.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtOpenCL.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 23%] Hipifying src/include/nvtx3/nvToolsExtPayload.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtPayload.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvToolsExtPayload.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtPayload.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 23%] Hipifying src/include/nvtx3/nvToolsExtSync.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtSync.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvToolsExtSync.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvToolsExtSync.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImpl.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxImpl.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCore.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxImplCore.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInit.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxInit.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 24%] Hipifying src/include/nvtx3/nvtx3.hpp -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtx3.hpp mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtx3.hpp -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtx3.hpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 27%] Hipifying src/include/nvtx3/nvtxDetail/nvtxTypes.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxTypes.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 27%] Hipifying src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 28%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 28%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 29%] Hipifying src/include/p2p.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/p2p.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/p2p.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/p2p.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 29%] Hipifying src/include/param.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/param.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/param.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/param.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 29%] Hipifying src/include/profiler.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/profiler.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 28%] Hipifying src/include/nvtx_stub.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx_stub.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/nvtx_stub.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/nvtx_stub.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 30%] Hipifying src/include/rccl_bfloat16.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rccl_bfloat16.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/rccl_bfloat16.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rccl_bfloat16.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 29%] Hipifying src/include/proxy.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/proxy.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 30%] Hipifying src/include/rccl_vars.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rccl_vars.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/rccl_vars.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rccl_vars.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 30%] Hipifying src/include/rocm_smi_wrap.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rocm_smi_wrap.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/rocm_smi_wrap.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rocm_smi_wrap.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 31%] Hipifying src/include/rocmwrap.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rocmwrap.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/rocmwrap.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/rocmwrap.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 31%] Hipifying src/include/shm.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/shm.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/shm.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/shm.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 31%] Hipifying src/include/signals.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/signals.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/signals.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/signals.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 31%] Hipifying src/include/socket.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/socket.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/socket.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/socket.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 32%] Hipifying src/include/transport.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/transport.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 32%] Hipifying src/include/trees.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/trees.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/trees.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/trees.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 32%] Hipifying src/include/timer.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/timer.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/timer.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/timer.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 32%] Hipifying src/include/strongstream.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/strongstream.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/strongstream.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/strongstream.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 33%] Hipifying src/include/utils.h -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/include/utils.h -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 33%] Hipifying src/misc/archinfo.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/archinfo.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/archinfo.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/archinfo.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 33%] Hipifying src/misc/argcheck.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/argcheck.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 34%] Hipifying src/misc/ibvsymbols.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/ibvsymbols.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 34%] Hipifying src/misc/ibvwrap.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/ibvwrap.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 34%] Hipifying src/misc/ipcsocket.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/ipcsocket.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 35%] Hipifying src/misc/msccl/msccl_lifecycle.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/msccl/msccl_lifecycle.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 33%] Hipifying src/init.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/init.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 35%] Hipifying src/misc/msccl/msccl_parser.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/msccl/msccl_parser.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 35%] Hipifying src/misc/msccl/msccl_status.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_status.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/msccl/msccl_status.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_status.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 35%] Hipifying src/misc/msccl/msccl_setup.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/msccl/msccl_setup.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 36%] Hipifying src/misc/npkit.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/npkit.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 36%] Hipifying src/misc/profiler.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/profiler.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 36%] Hipifying src/misc/param.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/param.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/param.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/param.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 36%] Hipifying src/misc/nvmlwrap_stub.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/nvmlwrap_stub.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/nvmlwrap_stub.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/nvmlwrap_stub.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 37%] Hipifying src/misc/rocm_smi_wrap.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/rocm_smi_wrap.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 37%] Hipifying src/misc/rocmwrap.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocmwrap.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/rocmwrap.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocmwrap.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 37%] Hipifying src/misc/shmutils.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/shmutils.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 37%] Hipifying src/misc/signals.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/signals.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/signals.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/signals.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 38%] Hipifying src/misc/socket.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/socket.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 38%] Hipifying src/misc/strongstream.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/strongstream.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/strongstream.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/strongstream.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 38%] Hipifying src/misc/utils.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/misc/utils.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 39%] Hipifying src/net.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/net.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 39%] Hipifying src/transport.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 39%] Hipifying src/proxy.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/proxy.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 39%] Hipifying src/transport/coll_net.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/coll_net.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 40%] Hipifying src/transport/net_socket.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/net_socket.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 40%] Hipifying src/transport/nvls.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/nvls.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 40%] Hipifying src/transport/net.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/net.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 40%] Hipifying src/transport/net_ib.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/net_ib.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 41%] Hipifying src/transport/p2p.cc -> /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc mkdir -p /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /usr/src/RPM/BUILD/rccl-2.18.6/src/transport/p2p.cc -o /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' cd /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /usr/src/RPM/BUILD/rccl-2.18.6 /usr/src/RPM/BUILD/rccl-2.18.6 /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/CMakeFiles/rccl.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/build gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/all_to_all.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/all_to_all.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/all_to_all.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/all_to_all.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx1101. 5 warnings generated when compiling for gfx803. 5 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_all.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx942. 5 warnings generated when compiling for gfx1030. 5 warnings generated when compiling for gfx908. 5 warnings generated when compiling for gfx906. 5 warnings generated when compiling for gfx1102. 5 warnings generated when compiling for gfx941. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/all_to_allv.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/all_to_allv.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/all_to_allv.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/all_to_allv.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_to_allv.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/bootstrap.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx1100. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/all_reduce.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/all_reduce.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/all_reduce.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/all_reduce.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx942. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx803. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:22:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 22 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:27:23: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx908. 3 warnings generated when compiling for gfx1030. 3 warnings generated when compiling for gfx906. 3 warnings generated when compiling for gfx900. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/all_gather.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/all_gather.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/all_gather.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/all_gather.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ 3 warnings generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ 3 warnings generated when compiling for gfx1030. 3 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:18:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 18 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:21:10: warning: unused variable 'msgsize' [-Wunused-variable] 21 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ 3 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/all_gather.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx906. 3 warnings generated when compiling for gfx940. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx941. 3 warnings generated when compiling for gfx1101. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/msccl.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/msccl.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/msccl.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/msccl.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for host. 4 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1030. 4 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/msccl.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx1101. 4 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx900. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/channel.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/channel.cc.o -MF CMakeFiles/rccl.dir/hipify/src/channel.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/channel.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 8 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/channel.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx941. 8 warnings generated when compiling for gfx1100. 8 warnings generated when compiling for gfx803. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/broadcast.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/broadcast.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/broadcast.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/broadcast.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx906. 3 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for host. 3 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ 3 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ 3 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1030. 3 warnings generated when compiling for gfx803. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:21:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 21 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:25:23: warning: unused variable 'payload' [-Wunused-variable] 25 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/broadcast.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/gather.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/gather.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/gather.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/gather.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/gather.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx906. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/debug.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/debug.cc.o -MF CMakeFiles/rccl.dir/hipify/src/debug.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/debug.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/debug.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx1030. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/scatter.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/scatter.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/scatter.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/scatter.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/scatter.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx942. 1 warning generated when compiling for gfx900. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/reduce_scatter.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/reduce_scatter.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/reduce_scatter.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/reduce_scatter.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ 3 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx1102. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx941. 3 warnings generated when compiling for gfx940. 3 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx1030. 3 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:22:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:27:27: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce_scatter.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/sendrecv.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/sendrecv.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/sendrecv.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/sendrecv.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ 4 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1100. 4 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx942. 4 warnings generated when compiling for gfx940. 4 warnings generated when compiling for gfx1102. 4 warnings generated when compiling for gfx803. 4 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:27:22: warning: unused variable 'payload' [-Wunused-variable] 27 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:50:22: warning: unused variable 'payload' [-Wunused-variable] 50 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/sendrecv.cc:18:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 18 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 4 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/reduce.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/reduce.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/reduce.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/reduce.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx900. 3 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx941. 3 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx906. 3 warnings generated when compiling for gfx940. 3 warnings generated when compiling for gfx1030. 3 warnings generated when compiling for gfx803. 3 warnings generated when compiling for gfx1102. 3 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx942. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:23:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 23 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:29:20: warning: unused variable 'payload' [-Wunused-variable] 29 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/reduce.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/enqueue.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 7 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 7 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 7 warnings generated when compiling for gfx942. 7 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:104:12: warning: unused variable 'y' [-Wunused-variable] 104 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:111:7: warning: unused variable 'localRanks' [-Wunused-variable] 111 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/connect.cc:230:21: warning: unused function 'getIndexes' [-Wunused-function] 230 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1030. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 20 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 20 warnings generated when compiling for gfx803. 20 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ 20 warnings generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 20 warnings generated when compiling for gfx90a. 20 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 20 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ 20 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ 20 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/paths.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 20 warnings generated when compiling for gfx1100. 20 warnings generated when compiling for gfx906. 20 warnings generated when compiling for gfx941. 20 warnings generated when compiling for gfx90a. 20 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/onerank_reduce.cu.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/onerank_reduce.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/onerank_reduce.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/onerank_reduce.cu.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/onerank_reduce.cu.cpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rings.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ 28 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, cIn file included from o/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.ccn:s22t: In file included from c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.hh:a60r: *In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.ha:t14t: r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.hV:a40l:u13e:) warning: {unused function 'log2i' [-Wunused-function] | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: 40unused function 'xmlSetAttr' [-Wunused-function] | static l144o | nsgt altoigc2 in(clcolnRge snu)l t{_ t | x ^~~~~m lSetAttr(structIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.ccn:c24c: l/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.hX:m206l:N21o:d ewarning: *unused function 'ncclTopoRankToIndex' [-Wunused-function] node, co n206s | ts tcahtairc* nactctlrRNeasmuel,t _cto nnsctc lcThoapro*R avnaklTuoeI)n d{e x (| s ^~~~~~~~~~t ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hc:t157 :n21c:c lwarning: Tunused function 'xmlSetAttrIfUnset' [-Wunused-function]o poSystem *157 | ssytsatteimc, nicnctl Rreasnukl,t _itn tx*m liSnedteAxt)t r{I f U| n ^~~~~~~~~~~~~~~~~~~s et(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.hs:t217r:u21c:t warning: nunused function 'ncclTopoDevToRank' [-Wunused-function]c clXmlNo d217e | *s tnaotdiec, nccocnlsRte scuhlatr_*t antctcrlNTaompeo,D ecvoTnosRta nckh(asrt*r uvcatl unec)c l{T o p| o ^~~~~~~~~~~~~~~~~S ys/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ht:e169m:*21 :s ywarning: sunused function 'xmlSetAttrInt' [-Wunused-function]t em, int 169d | esvt,a tiinct *n crcalnRke)s u{l t _| t ^~~~~~~~~~~~~~~~~ xmlSIn file included from e/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cct:A25t: t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hr:I94n:t21(:s twarning: runused function 'xmlGetAttrInt' [-Wunused-function]u ct ncclX m94l | Nsotdaet*i cn ondcec,l Rceosnusltt _cth axrm*l GaetttArtNtarmIen,t c(osntsrtu citn tn cvcallXumel)N o{d e *| ^~~~~~~~~~~~~n od/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.he:,182 :c21o:n swarning: tunused function 'xmlSetAttrFloat' [-Wunused-function] char* a t182t | rsNtaamtei,c innctc*l Rveasluulet)_ t{ x m| lS ^~~~~~~~~~~~~e tAt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ht:r101F:l21o:a twarning: (unused function 'xmlGetAttrIntDefault' [-Wunused-function]s truct ncc l101X | msltNaotdiec* nncocdleR,e scuolnts_tt cxhmalrG*e taAttttrrNIanmteD,e fcaounlstt( sftlrouactt vnaclculeX)m l{N o d| ^~~~~~~~~~~~~~~e * n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ho:d195e:,21 :c owarning: nunused function 'xmlUnsetAttr' [-Wunused-function]s t char *195 | astttartNiacm en,c cilnRte*s uvlatl_ute ,x milnUtn sdeetfAatutlrt(Vsatlruuec)t {n c c| l ^~~~~~~~~~~~~~~~~~~~X ml/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hN:o109d:e21*: nwarning: ounused function 'xmlGetAttrFloat' [-Wunused-function]d e, cons t109 | cshtaart*i ca tntcrcNlaRmees)u l{t _ t| ^~~~~~~~~~~~x ml/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hG:e207t:A21t:t rwarning: Funused function 'xmlGetSub' [-Wunused-function]l oat(str u207c | ts tnactcilcX mnlcNcoldRee*s nuoldte_,t cxomnlsGte tcShuabr(*s tartutcrtN anmcec,l XfmlloNaotd*e *v anloudee), {c o n| s ^~~~~~~~~~~~~~~t c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hh:a116r:*21 :s uwarning: bunused function 'xmlFindTag' [-Wunused-function]N ame, st r116u | cstt antciccl XnmclcNloRdees*u*l ts_utb )x m{l F i| n ^~~~~~~~~d Ta/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hg:(233s:t21r:u cwarning: tunused function 'xmlGetSubKvInt' [-Wunused-function] ncclXml* xm l233, | sctoantsitc cnhcacrl*R etsauglNatm_et, xsmtlrGuecttS unbcKcvlIXnmtl(Nsotdreu*c*t nnocdcel)X m{l N o| d ^~~~~~~~~~e * /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hn:o128d:e21,: cwarning: ounused function 'xmlFindTagKv' [-Wunused-function]n st char* s u128b | Nsatmea,t isct rnuccctl RnecscullXtm_ltN oxdmel*F*i nsduTba,g Kcvo(nssttr ucchta rn*c caltXtmrlN*a mxem,l ,c ocnosnts ti ncth aart*t rtVaaglNuaem)e ,{ s t| r ^~~~~~~~~~~~~~u ct/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h :n240c:c21l:X mwarning: lunused function 'xmlAddNode' [-Wunused-function]N ode** no d240e | ,s tcaotnisct ncchcalrR*e sualttt_rtN axmmel,A ddcNoondset( scthraurc*t antctcrlVXamllu*e )x m{l , | s ^~~~~~~~~~~~tr uct/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h :n144c:c21l:X mwarning: lunused function 'xmlSetAttr' [-Wunused-function]N ode* pa r144e | nstt,a tciocn sntc cclhRaers*u lstu_btN axmmel,S esttArtutcrt( sntcrculcXtm lnNcocdleX*m*l Nsoudbe)* {n o d| e ^~~~~~~~~~, c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ho:n256s:t21 :c hwarning: aunused function 'xmlRemoveNode' [-Wunused-function]r * att r256N | asmtea,t icco nnsctc lcRheasru*l tv_atl uxem)l R{e m o| v ^~~~~~~~~~e No/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hd:e157(:s21t:r uwarning: cunused function 'xmlSetAttrIfUnset' [-Wunused-function]t ncclXm l157N | osdtea*t inco dnec)c l{R e s| u ^~~~~~~~~~~~~l t_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ht: 276x:m21l:S ewarning: unused function 'kvConvertToInt' [-Wunused-function]t AttrIf U276n | ssetta(tsitcr uncctc lnRcecsluXlmtl_Nto dkev*C onnovdeer,t TcooInnstt( ccohnasrt* cahtatrr*N asmter,, cionnts*t vcahlaure*, vsatlruuec)t {k v D| i ^~~~~~~~~~~~~~~~~c t*/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h :d169i:c21t:) warning: {unused function 'xmlSetAttrInt' [-Wunused-function] | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h :169289 | :s21t:a twarning: iunused function 'kvConvertToStr' [-Wunused-function]c ncclR e289s | usltta_tti cx mnclcSleRteAstutlrtI_ntt (ksvtCrouncvte rntcTcolSXtmrl(Niondte *v anloudee,, ccoonnsst tc hcahra*r** sattrt,r Nsatmreu,c tc oknvsDti citn*t dviacltu)e ){ { | ^~~~~~~~~~~~~~| ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx941. 28 warnings generated when compiling for gfx900. 28 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx940. 28 warnings generated when compiling for gfx1101. 28 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ de* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:773:7: warning: unused variable 'nChannels' [-Wunused-variable] 773 | int nChannels = 0; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:783:12: warning: unused variable 'y' [-Wunused-variable] 783 | int x=0, y=0; | ^ 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1238:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1238 | static char ringRemap[64]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1242:7: warning: unused variable 'ncpus' [-Wunused-variable] 1242 | int ncpus = system->nodes[CPU].count; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1327:9: warning: unused variable 't' [-Wunused-variable] 1327 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1364:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1364 | static char ringRemap[256]; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1385:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1385 | int gcnt = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1460:9: warning: unused variable 't' [-Wunused-variable] 1460 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:1499:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1499 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:22: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:24: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/rome_models.cc:25: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx1100. 28 warnings generated when compiling for gfx908. 28 warnings generated when compiling for gfx942. 28 warnings generated when compiling for gfx90a. 28 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/trees.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 8 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx941. 8 warnings generated when compiling for gfx1102. 8 warnings generated when compiling for gfx1030. 8 warnings generated when compiling for gfx900. 8 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx1101. 8 warnings generated when compiling for host. 8 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:7: warning: variable 'devIndex' is used uninitialized whenever 'if' condition is false [-Wsometimes-uninitialized] 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:798:41: note: uninitialized use occurs here 798 | NCCLCHECK(ncclTopoGetXmlFromGpu(node, devIndex, xml, gpuNode)); | ^~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/checks.h:108:22: note: expanded from macro 'NCCLCHECK' 108 | ncclResult_t RES = call; \ | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:795:3: note: remove the 'if' if its condition is always true 795 | if (rocmsmiInit == 1) { | ^~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:790:20: note: initialize the variable 'devIndex' to silence this warning 790 | uint32_t devIndex; | ^ | = 0 In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.cc:15: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 8 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx908. 10 warnings generated when compiling for gfx941. 10 warnings generated when compiling for gfx1102. 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx90a. 10 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/search.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 10 warnings generated when compiling for gfx942. 10 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -MF CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx906. 28 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx941. 28 warnings generated when compiling for gfx1102. 28 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 28 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct nIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ cclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:330:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 330 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:20: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:368:3: note: expanded from macro 'IMPL_MAIN_KERN' 368 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:294:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 294 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:32:1: note: in instantiation of function template specialization 'ncclKernel' requested here 32 | IMPL_MAIN_KERN(); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:373:3: note: expanded from macro 'IMPL_MAIN_KERN' 373 | ncclKernel(comm, channelMask, workHead); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:298:34: note: uninitialized use occurs here 298 | copyToShmem16(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:271:14: note: initialize the variable 'dst' to silence this warning 271 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/enqueue.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:206:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 206 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 28 warnings generated when compiling for gfx90a. 28 warnings generated when compiling for host. 28 warnings generated when compiling for gfx803. 28 warnings generated when compiling for gfx1100. 28 warnings generated when compiling for gfx90a. 28 warnings generated when compiling for gfx900. 28 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ 9 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx803. 9 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx941. 9 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ 9 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/tuning.cc:11: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx942. 9 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data,In file included from size, m/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cch:a8n: dIn file included from l/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.he:,60 : rIn file included from e/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.hq:u14e: st/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h):)40;: 13r:e twarning: uunused function 'log2i' [-Wunused-function]r n ncclSuccess; } | ^~~~~~~~~~~~~ 40/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h | :s29t:a21t:i cwarning: unused function 'collNetTest' [-Wunused-function]l ong log2i(l o29n | gs tna)t i{c n| c ^~~~~c lResult_t collNetTest(struct In file included from n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.ccc:c10l: C/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.ho:m217m:*21 :c owarning: munused function 'ncclTopoDevToRank' [-Wunused-function]m , void* r217e | qsuteastti,c innctc*l Rdeosnuel,t _itn tn*c csliTzoep)o D{e vNTCoCRLaCnHkE(CsKt(rcuocmtm -n>cncclcTloCpoolSlyNsette-m>*t essyts(treemq,u eisntt, ddeovn,e ,i nsti*z er)a)n;k )r e{t u r| n ^~~~~~~~~~~~~~~~~ ncclSucIn file included from c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cce:s14s: ;/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h :}16 : 20| : ^~~~~~~~~~~ warning: unused function 'collNetName' [-Wunused-function] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function]16 | static co n30s | ts tcahtairc* nccoclllRNeestuNlatm_et( sctorlulcNte tnCclcolsCeoCmoml*l (csotmrmu)c t{ nrcectluCronm mc*o mcmo-m>mn,c cvloCiodl*l Nceotl-l>Cnoammme); {} N C| C ^~~~~~~~~~~L CHE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.hC:K19(:c21o:m mwarning: -unused function 'collNetListen' [-Wunused-function]> ncclCollNet- >19c | lsotsaetCiocl ln(cccollRleCsoumlmt)_)t; croeltluNrent LnicsctleSnu(csctersusc;t }n c c| l ^~~~~~~~~~~~~~~~C om/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.hm:*31 :c21o:m mwarning: ,unused function 'collNetCloseListen' [-Wunused-function] int dev, v o31i | ds*t ahtaincd lnec,c lvRoeisdu*l*t _lti sctoelnlCNoemtmC)l o{s eNLCiCsLtCeHnE(CsKt(rcuocmtm -n>cncclcCloCmoml*l Nceotm-m>,l ivsotiedn*( dleivs,t ehnaCnodmlme), {l iNsCtCeLnCCHoEmCmK)()c;o mrme-t>unrcnc lnCcoclllSNuectc-e>scsl;o s}e L i| s ^~~~~~~~~~~~~t en/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h(:l20i:s21t:e nwarning: Cunused function 'collNetConnect' [-Wunused-function]o mm)); return nccl S20u | cscteastsi;c }n c c| l ^~~~~~~~~~~~~~~~~~R esult_t collNeIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.ccC:o17n: n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.he:c128t:(21s:t rwarning: uunused function 'xmlFindTagKv' [-Wunused-function]c t ncclComm* c128o | msmt,a tvioci dn*c chlaRnedsluelst[_]t, ximnltF innrdaTnakgsK,v (isnttr urcatn kn,c cvloXimdl** lximslt,e ncCoonmsmt, cvhoaird** *t acgoNlalmCeo,m ms)t r{u cNtC CnLcCcHlEXCmKl(Ncoodmem*-*> nncocdleC,o lcloNnestt- >cchoanrn*e catt(thraNnadmlee,s ,c onnrsatn kcsh,a rr*a nakt,t rlViasltueen)C o{m m ,| ^~~~~~~~~~~~c oll/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hC:o144m:m21):) ;warning: unused function 'xmlSetAttr' [-Wunused-function]r eturn nc c144l | Ssutcacteiscs ;n c}c l R| e ^~~~~~~~~~~~~~s ult/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h_:t21 :x21m:l Swarning: eunused function 'collNetReduceSupport' [-Wunused-function]t Attr(struct nc c21l | XsmtlaNtoidce *n cncoldRee,s uclotn_stt ccohlalrN*e taRtetdruNcaemSeu,p pcoornts(ts tcrhuacrt* nvcaclluCeo)m m{* c| o ^~~~~~~~~~m m,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h :n157c:c21l:D awarning: tunused function 'xmlSetAttrIfUnset' [-Wunused-function]a Type_t d a157t | asTtyaptei,c nnccccllRReedsOupl_tt_ tr exdmOlpS,e tiAnttt*r IsfuUpnpsoertt(esdt)r u{c tN CnCcLcClHXEmClKN(ocdoem*m -n>ondcec,l CcoolnlsNte tc-h>arre*d uactetSruNpapmoer,t (cdoantsatT ycphe, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ ar* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ 23 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx1100. 23 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ 23 warnings generated when compiling for gfx803. 23 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx1102. 23 warnings generated when compiling for gfx90a. 23 warnings generated when compiling for gfx90a. 23 warnings generated when compiling for gfx942. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:865:19: warning: variable 'cId' set but not used [-Wunused-but-set-variable] 865 | int gIndex = 0, cId = 0, n = 0; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:10: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/group.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/group.cc.o -MF CMakeFiles/rccl.dir/hipify/src/group.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/group.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1030. 2 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1102. 2 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx908. 2 warnings generated when compiling for gfx1101. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx90a. 2 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/group.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/group.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx942. 2 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvsymbols.cc:64: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for host. 1 warning generated when compiling for gfx941. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/archinfo.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/argcheck.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/argcheck.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ipcsocket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/ibvwrap.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/ibvwrap.h:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ 3 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ 3 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx906. 3 warnings generated when compiling for gfx941. 3 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for gfx1101. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx90a. 3 warnings generated when compiling for gfx908. 3 warnings generated when compiling for gfx940. 3 warnings generated when compiling for gfx803. 3 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for gfx942. 3 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/init.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 45 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 45 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.ccl:l2311N:e26t:- >warning: cunused variable 'payload' [-Wunused-variable]l oseColl(co l2311l | C o mNmv)t)x;P arreatmusrCno mnmcIcnliStuRcacneks sp;a y}l o a| d ^~~~~~~~~~~~~~~~{ ran/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.hk:,31 :n21:r warning: aunused function 'collNetCloseListen' [-Wunused-function]n ks, cudaDev }31; | s t| a ^~~~~~~t ic ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cca:m2341e:,26 :i nwarning: tunused variable 'payload' [-Wunused-variable]* value, i2341n | t dNevftaxuPlatrVaamlsuCeo)m m{I n i| t ^~~~~~~~~~~~~~~~~~~~R ank/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h :p109a:y21l:o awarning: dunused function 'xmlGetAttrFloat' [-Wunused-function]{ rank, nr a109n | ksst,a tciucd anDcecvl}R;e s u| l ^~~~~~~t _t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct nc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.ccc:l2009X:m38l:N ode* node,warning: unused variable 'CommInitAllSchema' [-Wunused-variable]c onst char* attr N2009a | m e ,c ocnosntsetx pcrh anrv*t xvPaalyuleo)a d{S c h| e ^~~~~~~~~~~~~~~~~m aEn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ht:r169y:_21t: Cwarning: ounused function 'xmlSetAttrInt' [-Wunused-function]m mInitAl l169S | cshteamtai[c] n=c c{l R e| s ^~~~~~~~~~~~~~~~~u lt_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* ha/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ ndle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(i/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ nt value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ 45 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return nc45clSuccess; warning s} generated when compiling for | gfx941 ^~~~~~~~~~~~~~~~~~. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t In file included from xmlSetAt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cct:r10I: nIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h(:s9t: rIn file included from u/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.hc:t11 : nIn file included from c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.hc:l12X: mIn file included from l/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.hN:o124d: eIn file included from */usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h :n14o: dIn file included from e/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h,: 60c: oIn file included from n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.hs:t14 : ch/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.ha:r40*: 13a:t twarning: runused function 'log2i' [-Wunused-function]N ame, const int value) 40{ | s t| a ^~~~~~~~~~~~~t ic /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hl:o182n:g21 :l owarning: gunused function 'xmlSetAttrFloat' [-Wunused-function]2 i(long n182) | s{t a t| i ^~~~~c ncclResult_t xmlSetAttrFloat(strucIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc :n17c: c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.hl:X16m:l20N:o dwarning: eunused function 'collNetName' [-Wunused-function]* node, c o16n | sstt acthiacr *c oantsttr Ncahmaer,* ccoonlsltN eftlNoaamte (vsatlruuec)t {n c c| l ^~~~~~~~~~~~~~~C om/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.hm:*195 :c21o:m mwarning: )unused function 'xmlUnsetAttr' [-Wunused-function] { retur n195 | csotmamt-i>cn cncclcCloRlelsNueltt-_>tn axmmel;U n}s e t| A ^~~~~~~~~~~t tr(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.hs:t17r:u21c:t warning: nunused function 'collNetDevices' [-Wunused-function]c clXmlNode *17 | nsotdaet,i cc onncsctl Rcehsaurl*t _att tcroNlalmNee)t D{e v i| c ^~~~~~~~~~~~e s(s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.ht:r207u:c21t: nwarning: cunused function 'xmlGetSub' [-Wunused-function]c lComm* c207o | msmt,a tiinct *n cncdleRve)s u{l tN_CtC LxCmHlEGCeKt(Scuobm(ms-t>rnuccctl CnoclcllNXemtl-N>oddeev*i cneosd(en,d ecvo)n)s;t rcehtaurr*n snucbcNlaSmuec,c esstsr;u c}t n| c ^~~~~~~~~~~~~~c lX/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.hm:l18N:o21d:e *warning: *unused function 'collNetGetProperties' [-Wunused-function] sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h18: | 233s:t21a:t iwarning: cunused function 'xmlGetSubKvInt' [-Wunused-function] ncclResult _233t | sctoaltliNc ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ etGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 45 warnings generated when compiling for gfx1102. 45 warnings generated when compiling for gfx90a. 45 warnings generated when compiling for gfx906. 45 warnings generated when compiling for gfx90a. 45 warnings generated when compiling for gfx1101. 45 warnings generated when compiling for gfx1100. 45 warnings generated when compiling for gfx803. 45 warnings generated when compiling for gfx942. 45 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1675:11: warning: unused variable 'stackSize' [-Wunused-variable] 1675 | int64_t stackSize; | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1676:19: warning: unused variable 'devProp' [-Wunused-variable] 1676 | hipDeviceProp_t devProp; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1995:26: warning: unused variable 'payload' [-Wunused-variable] 1995 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2009:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2009 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2311:26: warning: unused variable 'payload' [-Wunused-variable] 2311 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:2341:26: warning: unused variable 'payload' [-Wunused-variable] 2341 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:37: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:38: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:782:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 782 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/init.cc:1980:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 1980 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 45 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_status.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1100. 4 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1030. 4 warnings generated when compiling for gfx941. 4 warnings generated when compiling for gfx900. 4 warnings generated when compiling for gfx908. 4 warnings generated when compiling for gfx906. 4 warnings generated when compiling for gfx90a. 4 warnings generated when compiling for gfx1101. 4 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:76:16: warning: unused variable 'status' [-Wunused-variable] 76 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:132:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 132 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_setup.cc:6: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx942. 4 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/nvmlwrap_stub.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/npkit.cc:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/param.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx908. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx906. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx900. 9 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx942. 9 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/profiler.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/profiler.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/proxy.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocm_smi_wrap.cc:23: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/rocmwrap.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/signals.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/shmutils.cc:17: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/utils.cc:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/strongstream.cc gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/misc/socket.cc:8: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/net.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/net.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/net.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/proxy.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -MF CMakeFiles/rccl.dir/hipify/src/proxy.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/proxy.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_socket.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx941. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/nvls.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 21 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from 21 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct c21 warnings generated when compiling for gfx940. onnectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ 21 warnings generated when compiling for gfx908. 21 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ 21 warnings generated when compiling for gfx900. 21 warnings generated when compiling for gfx1101. 21 warnings generated when compiling for gfx1102. 21 warnings generated when compiling for gfx90a. 21 warnings generated when compiling for gfx941. 21 warnings generated when compiling for gfx1030. 21 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:9: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, int size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, int size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:12: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ 21 warnings generated when compiling for gfx942. 21 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 17 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 17 warnings generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net_ib.cc:28: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 17 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx1102. 11 warnings generated when compiling for gfx940. 11 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx1030. 11 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx941. 11 warnings generated when compiling for gfx906. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx803. 11 warnings generated when compiling for gfx900. 11 warnings generated when compiling for gfx90a. 11 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:201:19: warning: unused variable 'md' [-Wunused-variable] 201 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:19: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/net.cc:265:21: warning: unused function 'netDumpMap' [-Wunused-function] 265 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx942. 11 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx90a. 5 warnings generated when compiling for gfx940. 5 warnings generated when compiling for gfx906. 5 warnings generated when compiling for gfx908. 5 warnings generated when compiling for gfx90a. 5 warnings generated when compiling for gfx941. 5 warnings generated when compiling for gfx1102. 5 warnings generated when compiling for gfx803. 5 warnings generated when compiling for gfx900. 5 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:8: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/p2p.cc:13: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:195:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 195 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:206:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 206 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:217:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 217 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/graph/topo.h:229:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 229 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx942. 5 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx940. 1 warning generated when compiling for gfx90a. 1 warning generated when compiling for gfx900. 1 warning generated when compiling for gfx1030. 1 warning generated when compiling for gfx803. 1 warning generated when compiling for gfx1101. 1 warning generated when compiling for gfx1102. 1 warning generated when compiling for gfx906. 1 warning generated when compiling for gfx908. 1 warning generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/transport/shm.cc:7: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/comm.h:11: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/transport.h:12: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/graph.h:124: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/info.h:14: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/core.h:60: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/alloc.h:14: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include/utils.h:40:13: warning: unused function 'log2i' [-Wunused-function] 40 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. 1 warning generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:187:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 187 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllGather, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:187:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 187 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllGather, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx900. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8 warnings generated when compiling for gfx803. 8 warnings generated when compiling for gfx908. 8 warnings generated when compiling for gfx906. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx1101. 8 warnings generated when compiling for gfx1102. 8 warnings generated when compiling for gfx900. 8 warnings generated when compiling for gfx1100. 8 warnings generated when compiling for gfx941. 8 warnings generated when compiling for gfx1030. 8 warnings generated when compiling for gfx940. 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_gather.h:173:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 173 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllGather, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8 warnings generated when compiling for host. 8 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h ^~~~~: 514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE7 warnings generated when compiling for gfx908. , LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthrIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ eads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Pr 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ od, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx942. 7 warnings generated when compiling for host. 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 25 warnings generated when compiling for gfx90a. 25 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2,7 warnings generated when compiling for gfx908. flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, 7 warnings generated when compiling for gfx1030. LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMax<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMax<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMax<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMax<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMax<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMax<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMin<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMin<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMin<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMin<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMin<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMin<__half>, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ zeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit7, warning s& generatedt when compiling for rgfx1030e. e->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlocIn file included from k/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp(:t1h: rIn file included from e/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:d10I: dIn file included from x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h.:x169/: W/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hA:R509P:_29S:I Zwarning: Efield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]) , | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | 507f | l a g T htrieda(dt(i(dt)i,d %n4t)h=r=e3a)d,s (gnrtohurpe(agdrso)u,p )w,i d (| t ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~i d %| W warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3A RP_SIZ E510) | , w a rspt(etpiSdi/zWeA(RnPc_cSlISZhEm)e,m . c| o ~~~~~~~~~~~~~~~~~~m m .| b stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)u ffSiz e508s | [ N C C Lw_aPrRpOITnOB_lLoLc1k2(8t]h/rNeCaCdLI_dSxT.ExP/SW/AsRiPz_eSoIfZ(Eu)i,n t 6| 4 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~_ t )| ) warp(tid/WARP_SIZE { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 509 | | group(group flagThread((ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:%4514:)9=:= 3note: )in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here, group( g451r | o u p ) prims(tid, nthreads, ,t r e| e ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~- > d| o warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3w n, tree -510> | d o w n ,s taerpgSsi-z>es(enncdcbluSfhfm,e ma.rcgosm-m>.rbeucfvfbSuifzfe,s [aNrCgCsL-_>PrReOdTOOp_ALrLg1)2;8 ] /| N ^C CL_STE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hP:S994/:s5i:z enote: oin instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested heref (uin t9946 | 4 _ t ) )r u{n T r| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e S p| l group(groupi t (note: ain instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested herer gs); | ^ 491 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202 : 53p:r inote: min instantiation of member function 'RunWorkElement, 0, 1>::run' requested heres (tid, 202n | t h r e a d s S pRluintW,o rtkrEelee-m>ednotwduOpp,, aArlggso-,> sPernodtbou>f(f),. raurng(sw-e>)r;e c v| b ^u ff, ar/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cppg:s13-:>1r:e dnote: Oin instantiation of member function 'RunWork, 0, 1>::run' requested herep Arg, 130 | *IPMrPoLt_oC:O:LMLa_xFGUrNoCu(pAWlildRtehd)u;c e ,| ^T REE, L/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hL:19942:85,: Pnote: rin instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested heree MulS u994m | , d o urbulneT)r e e| S^p lit ( aRrugnsW)o;r k <| n ^c clFunc#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h#:f202u:n53c:, note: tin instantiation of member function 'RunWorkElement, 0, 1>::run' requested herey pe, F u202n | c # # d e v r e dRoupno,r kNEClCeLm_eAnLtGt(o)>.(r)u.nr(uwen)(;& n c| c ^l Shmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:451:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 451 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:491:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 491 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:533:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 533 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:994:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 994 | runTreeSplit(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, TREE, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 37 warnings generated when compiling for gfx90a. 37 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] In file included from 153/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp | : 1 : In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hu:i10n: tIn file included from 3/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h2:_169t: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hd:a271t:a191:, warning: funused variable 'ptr' [-Wunused-variable]l ag1, data2, f271l | a g 2 ; | ^~~~~ ui/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.hn:t1536:435_:t *warning: unused variable 'flag2' [-Wunused-variable]p tr = r153e | c v P t ru(i0n)t+3l2l_1t2 8dOaftfas1e,t ;f l a| g ^~~1 , data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2,In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Sizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ^ :562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid) ,562 | n t h r etaidds((tnitdh)r,e andtsh)r,e atdisd(InntBhlroecakd(st)h,r etaiddIIdnxB.lxo)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u p| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)g roup), 563 | | ^~~~~~~~~~~~~~~~~ s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:e562p:S60i:z enote: (field 'group' will be initialized after field 'stepSize'n cclShm e562m | . c o m mt.ibdu(ftfiSdi)z,e sn[tNhCrCeLa_dPsR(OnTtOh_rSeIaMdPsL)E,] /tNiCdCILn_BSlToEcPkS(/tshirzeeaodfI(dTx).)x ){, g| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~o u p| ( group(groupg roup), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/:N562C:C15L:_ Swarning: Tinitializer order does not match the declaration order [-Wreorder-ctor]E PS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~562 | | group(group tid(tid), nthreads(nthreads), tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hI:n275B:l90o:c knote: (in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret hreadIdx .275x | ) , g r o uPpr(igmriotuipv)e,s < T| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ R e| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)O p, Fan A563s | y m m e tsrtiecpf,f S/i*zDeisr[eNcCtC=L*_/P0R,O TPOr_oStIoM,P L0E>] /pNrCiCmLs_ S T| E ^P S/sizeo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hf:(595T:)5): {note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | 595 group(group | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereP rotoSim p275l | e < 1 , 1 >P>r(iamrigtsi)v;e s <| T ^, RedOp, FanA/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:y202m:m53e:t rnote: iin instantiation of member function 'RunWorkElement, 0, 2>::run' requested herec E,l e/m*eDnitro ,p rPirmost o >| ( ^) .run(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hw:e595):;5 : | note: ^in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp :r9u:n1T:r enote: ein instantiation of member function 'RunWork, 0, 2>::run' requested hereU pDown <9T | ,I MRPeLd_OCpO,L LP_rFoUtNoCS(iAllRmepdluecE>E(,a rSgIsM)P;L E ,| ^S umPostDi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hv:,202 :u53i:n tnote: 6in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here4 _t) | 202^ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hR:u391n:W95o:r knote: Eexpanded from macro 'IMPL_COLL_FUNC'l ementu(n)c.,r utny(pwee,) ;F u n| c ^# #devred/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cppo:p9<:t1y:p enote: >in instantiation of member function 'RunWork, 0, 2>::run' requested here, NCC L9_ | AILMGPOL__#C#OaLlLg_oF,U NNCC(CALl_lPRReOdTuOc_e#,# pTrRoEtEo,> (S)I.MrPuLnE(,& nScucmlPSohsmteDmi.vw,o ruki)n;t 6\4 _ t| ) ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::562391::1595:: note: note: field 'nthreads' will be initialized after field 'tidInBlock'expanded from macro 'IMPL_COLL_FUNC' 562 | 391 | tRiudn(Wtoirdk)<,n cnctlhFruenacd#s#(fnutnhcr,e atdysp)e,, tFiudnIcn#B#ldoecvkr(etdhorpe.,x )N,C CgLr_oAuLpG(Og_r#o#uapl)g,o , | N ^~~~~~~~~~~~~~~~~C CL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hP:R562O:T60O:_ #note: #field 'group' will be initialized after field 'stepSize'p roto> (562) | . r u n (t&indc(ctliSdh)m,e mn.twhorreka)d;s (\n t h| r ^e ads), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:I15n:B lnote: ofield 'nthreads' will be initialized after field 'tidInBlock'c k(thre a562d | I d x . xt)i,d (gtriodu)p,( gnrtohurpe)a,d s (| n ^~~~~~~~~~~t hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 19 warnings generated when compiling for gfx908. 19 warnings generated when compiling for gfx90a. 19 warnings generated when compiling for gfx940. 19 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 19 warnings generated when compiling for gfx803. 19 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 19 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 19 warnings generated when compiling for host. 19 warnings generated when compiling for gfx1101. 19 warnings generated when compiling for gfx1100. 19 warnings generated when compiling for gfx906. 19 warnings generated when compiling for gfx900. 19 warnings generated when compiling for gfx1030. 19 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2,In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cppf:l1a: gIn file included from 2/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h;: 10 : | In file included from ^~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h :169/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h: :/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h153::27135::19 :warning: unused variable 'flag2' [-Wunused-variable]warning: unused variable 'ptr' [-Wunused-variable] 153 | uint32_ t271 | d a t a 1 , f luaign1t,6 4d_att*a 2p,t rf l=a gr2e;c v P| t ^~~~~r (0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Op, FanAsymmetric<1, NCCL_MAX_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::562275::1590:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Pr i562m | i t i v etsid,x ./x*)D,i rgercotu=p*(/g0r,o uPpr)o,t o ,| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~0 > | p tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r ims | ^563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hs:t595e:p5S:i znote: ein instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here( nccl S595h | m e m . croumnmT.rbeuefUfpSDiozwens<[TN,C CRLe_dPORpO,T OP_rSoItMoPSLiEm]p/lNeCE>P(Sa/rsgisz)e;o f (| T ^) ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 202 group(group: 53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 324 :R90u:n Wnote: oin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer kElemen t324< | F n , T , PRreidmOipt,i vAelsg,( )F.arnuAns(ywmem)e;t r i| c ^< 1, NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cppM:A5X:_1D:E Vnote: _in instantiation of member function 'RunWork, 0, 2>::run' requested hereA RITY >5, | I/M*PDLi_rCeOcLtL=_*F/U0N,C (PArloltRoe,d u0c>e ,p rTiRmEsE , | S ^I MPLE, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hS:u595m:,5 :u inote: nin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested heret 8_t) 595 | | ^ runT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e391e:U95p:D onote: wexpanded from macro 'IMPL_COLL_FUNC'n c>#(#afrugnsc),; t y| p ^e , Func#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h#:d202e:v53r:e dnote: oin instantiation of member function 'RunWorkElement, 0, 2>::run' requested herep | , N C C L _ A LRGuOn_W#o#raklEgloe,m eNnCtCl(g)o.,r uPnr(o&tnoc>c(l)S.hrmuenm(.wweo)r;k ) ;| ^\ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::1562:: 15note: :in instantiation of member function 'RunWork, 0, 2>::run' requested here note: field 'nthreads' will be initialized after field 'tidInBlock' 7 | IMP L562_ | C O L L _tFiUdN(Ct(iAdl)l,R endtuhcree,a dTsR(EnEt,h rSeIaMdPsL)E,, tSiudmI,n Bulionctk3(2t_htr)e a d| I^d x.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :g391r:o95u:p (note: gexpanded from macro 'IMPL_COLL_FUNC'r oup), | 391 ^~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hR:u562n:W60o:r knote: , NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElemen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ t().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*:D562i:r15e:c twarning: =*initializer order does not match the declaration order [-Wreorder-ctor]/ 0, Proto, 0> prims | ^ 562 | tid(tid), nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:s595(:n5t:h rnote: ein instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herea ds), tidI n595B | l o c k (rtuhnrTeraedeIUdpxD.oxw)n,< Tg,r oRuepd(Ogpr,o uPpr)o,t o S| i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~m p l| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)< 1, 1>> (563a | r g s ) ;s t e| p ^S ize(ncc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hl:S202h:m53e:m .note: cin instantiation of member function 'RunWorkElement, 0, 2>::run' requested hereo mm.buf f202S | i z e s [ N C C LR_uPnRWOoTrOk_ESlIeMmPeLnEt]| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~) . r| u group(groupn (we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h: 3247: | 90I:M Pnote: Lin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here_ COLL_F U324N | C ( A l l R ePdruicmei,t iTvReEsE<,T ,S IRMePdLOEp,, SFuamn,A suyimnmte3t2r_itc)< 1 ,| ^N CCL_MA/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hX:_391D:E95V:_ Anote: Rexpanded from macro 'IMPL_COLL_FUNC'I TY>, /*D i391r | e c tR=u*n/W0o,r kPc #p#rfiumnsc , | t ^y pe, Fu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:c595#:#5d:e vnote: rin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested heree dop< t595y | p e > , rNuCnCTLr_eAeLUGpOD_o#w#na,( )1.>r>u(na(r&gnsc)c;l S h| m ^e m.work); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h\: 202 :| 53 ^: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :202562 | : 15 : note: field 'nthreads' will be initialized after field 'tidInBlock' RunWo r562k | E l e m etnitd<(Ftni,d )T,, nRtehdrOepa,d sA(lngtoh,r ePardost)o,> (t)i.drIunnB(lwoec)k;( t h| r ^e adIdx.x)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp,: 9g:r1o:u pnote: (in instantiation of member function 'RunWork, 0, 2>::run' requested hereg roup )9, | I M| P ^~~~~~~~~~~~~~~~~L _CO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:L562_:F60U:N Cnote: (field 'group' will be initialized after field 'stepSize'A llRed u562c | e , T RtEiEd,( tSiIdM)P,L En,t hSruema,d su(inntth6r4e_atd)s ) ,| ^t idInBlo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hc:k391(:t95h:r enote: aexpanded from macro 'IMPL_COLL_FUNC'd Idx.x), 391g | r o uRpu(ngWroorukp<)n,c c l| F ^~~~~~~~~~~u nc##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:x562.:x15):, warning: ginitializer order does not match the declaration order [-Wreorder-ctor]r oup(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562562 | : 60 : note: tfield 'group' will be initialized after field 'stepSize'i d(tid) ,562 | n t h r etaidds((tnitdh)r,e andtsh)r,e atdisd(InntBhlroecakd(st)h,r etaiddIIdnxB.lxo)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u p| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)g roup), 563 | | ^~~~~~~~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ X_DEV_ARITY>, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::1515:: warning: warning: initializer order does not match the declaration order [-Wreorder-ctor]initializer order does not match the declaration order [-Wreorder-ctor] 562562 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563563 | | sstteeppSSiizzee((nnccccllSShhmmeemm..ccoommmm..bbuuffffSSiizzeess[[NNCCCCLL__PPRROOTTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ O_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :10562 | :I15M:P Lwarning: _initializer order does not match the declaration order [-Wreorder-ctor]C OLL_FUNC(AllReduce ,562 | T R E E ,t iSIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | Run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here WorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hk:<562ncclFunc##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 27 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for host. 27 warnings generated when compiling for gfx1030. 27 warnings generated when compiling for gfx1101. 27 warnings generated when compiling for gfx900. 27 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.htid), nth:r562e:a15d:s warning: (ninitializer order does not match the declaration order [-Wreorder-ctor]t hreads), tidInBlock(thre a562d | I d x . xt)i,d (gtriodu)p,( gnrtohurpe)a,d s (| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t h r| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)a ds), tidInBlo c563k | ( t h r esatdeIpdSxi.zxe)(,n cgcrloSuhpm(egmr.ocuopm)m,. b u| f ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~f S i| z tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e s[NCCL _563P | R O T O _sStIeMpPSLiEz]e/(NnCcCcLl_SShTmEePmS./csoimzme.obfu(fTf)S)i z{e s [| N ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C C L| _ group(groupP ROTO_SIMPLE]/NCCL_STEPS/s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:z324e:o90f:( Tnote: )in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | 324 group(group | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herem metric< 1324, | N C C L _ MPArXi_mDiEtVi_vAeRsI ,R e/d*ODpi,r eFcatn=A*s/y0m,m ePtrroitco<,1 ,0 >N CpCrLi_mMsA X _| D ^E V_ARIT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hY:>595,: 5/:* Dnote: iin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herer ect= *595/ | 0 , P rroutnoT,r e0e>U ppDroiwmns< T ,| ^R edOp, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hP:r595o:t5o:S inote: min instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herep le<1, 5951 | > > ( a rrgusn)T;r e e| U ^p Down, 0, 2>::run' requested herer otoSi m202p | l e < 1 , 1 > >R(uanrWgosr)k;E l e| m ^e nt, 0, 2>::run' requested here Algo, 202P | r o t o > ( ) . rRuunn(Wwoer)k;E l e| m ^e nt, 0, 2>::run' requested here Algo ,4 | PIrMoPtLo_>C(O)L.Lr_uFnU(NwCe()A;l l R| e ^d uce, TRE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cppE:,6 :S1I:M Pnote: Lin instantiation of member function 'RunWork, 0, 2>::run' requested hereE , Pr o6d | ,I MiPnLt_8C_OtL)L _ F| U^N C(AllR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:d391u:c95e:, note: Texpanded from macro 'IMPL_COLL_FUNC'R EE, SIM P391L | E , RPurnoWdo,r kiR,u nNWCoCrLk_r(e)d.orpuc,l SNhCmCeLm_.AwLoGrOk_)#;# a\l g o| , ^ NCCL_P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hR:O562T:O15_:# #note: pfield 'nthreads' will be initialized after field 'tidInBlock'r oto>() .562r | u n ( & ntcicdl(Sthimde)m,. wnotrhkr)e;a d\s ( n| t ^h reads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :t562i:d15I:n Bnote: lfield 'nthreads' will be initialized after field 'tidInBlock'o ck(thr e562a | d I d x .txi)d,( tgirdo)u,p (ngtrhoruepa)d,s ( n| t ^~~~~~~~~~~~~~~~~h rea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:s562):,60 :t inote: dfield 'group' will be initialized after field 'stepSize'I nBlock (562t | h r e a dtIiddx(.txi)d,) ,g rnotuhpr(egardosu(pn)t,h r e| a ^~~~~~~~~~~~~~~~~d s), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:I60n:B lnote: ofield 'group' will be initialized after field 'stepSize'c k(thr e562a | d I d x .txi)d,( tgirdo)u,p (ngtrhoruepa)d,s ( n| t ^~~~~~~~~~~h reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threa T, RedOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | ste/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ pSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h>(args); | 562 ^ | tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:t202i:d53):, note: nin instantiation of member function 'RunWorkElement, 0, 2>::run' requested heret hread s202( | n t h r e a d s )R,u ntWiodrIknEBlleomcekn(tt ( )| . ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r u n| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)w e); | ^563 | st/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cppe:p6S:i1z:e (note: nin instantiation of member function 'RunWork, 0, 2>::run' requested herec clSh m6e | mI.McPoLm_mC.ObLuLf_fFSUiNzCe(sA[lNlCRCeLd_uPcReO,T OT_RSEIEM,P LSEI]M/PNLCEC,L _PSrToEdP,S /isnitz3e2o_ft()T ) )| ^{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 391 group(group: 95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:k275<:n90c:c lnote: Fin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereu nc##fun c275, | t y p e , PFruinmci#t#idveevsr ,F aNnCACsLy_mAmLeGtOr_i#c#t,o >/(*)D.irruenc(t&=n*c/c0l,S hPmreomt.ow,o r0k>) ;p r\i m | s ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:: 595note: :field 'nthreads' will be initialized after field 'tidInBlock'5 : note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 562 | 595 | t i d (rtuindT)r,e enUtphDroewandea>d(Iadrxg.sx));, g| r ^o up(group)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 202 :| 53 ^~~~~~~~~~~~~~~~~: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60: 202note: | field 'group' will be initialized after field 'stepSize' 562R | u n W otrikdE(lteimde)n,t l(o)c.kr(utnh(rweea)d;I d x| . ^x ), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cppp:(9g:r1o:u pnote: )in instantiation of member function 'RunWork, 0, 2>::run' requested here, | ^~~~~~~~~~~ 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | ste/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hp:S562i:z15e:( nwarning: cinitializer order does not match the declaration order [-Wreorder-ctor]c lShmem.comm.buff S562i | z e s [ NtCiCdL(_tPiRdO)T,O _nStIhMrPeLaEd]s/(NnCtChLr_eSaTdEsP)S,/ stiizdeIonfB(lTo)c)k ({t h| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e a d| I group(groupd x.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h):,275 : 90| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 275 | 563 | sPtreipmSiitzieve(snL,_ S/T*EDPiSr/escitz=e*o/f0(,T )P)r o{t o ,| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~0 > | p group(groupr ims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::275595::590:: note: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herein instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 595 | 275 | r u n T r ePerUipmDiotwinvN>C(CaLr_gMsA)X;_ D E| V ^_ ARITY, 1/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:,202 :/53*:D inote: rin instantiation of member function 'RunWorkElement, 0, 2>::run' requested heree ct=*/ 0202, | P r o t o , 0R>u npWroirmksE l e| m ^e nt, ProtoSimple<1, 1>>' requested hereO p, A l595g | o , P rroutnoT>r(e)e.UrpuDno(wwne<)T;, R| e ^d Op, Prot/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cppo:S9i:m1p:l enote: , 0, 2>::run' requested here1 , 1> >9( | aIrMgPsL)_;C O L| L ^_ FUNC(All/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hR:e202d:u53c:e ,note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested hereT REE, S202I | M P L E , P r oRdu,n WuoirnktE6l4e_mte)n t <| F^n , T, Re/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:O391p:,95 :A lnote: gexpanded from macro 'IMPL_COLL_FUNC'o , Proto> (391) | . r unR(uwneW)o;r k< n| c ^c lFunc##f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cppu:n8c:,1 :t ynote: pin instantiation of member function 'RunWork, 0, 2>::run' requested heree , Fu n8c | #I#MdPeLv_rCeOdLoLp_A,l lNRCeCdLu_cAeL,G OT_R#E#Ea,l gSoI,M PNLCEC,L _PPrRoOdT,O _i#n#tp6r4o_tto)> ( )| .^r un(&nc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hc:l391S:h95m:e mnote: .expanded from macro 'IMPL_COLL_FUNC'w ork); \ 391| | ^ RunW/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:562r:k15<:n cnote: cfield 'nthreads' will be initialized after field 'tidInBlock'l Func## f562u | n c , ttyipde(,t iFdu)n,c #n#tdherveraeddso(pnd,s )N,C CtLi_dAILnGBOl_o#c#ka(ltghor,e aNdCICdLx_.PxR)O,T Og_r#o#uppr(ogtroo>u(p)).,r u n| ( ^~~~~~~~~~~~~~~~~& ncc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:S562h:m60e:m .note: wfield 'group' will be initialized after field 'stepSize'o rk); \562 | | ^ tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:)15,: nnote: tfield 'nthreads' will be initialized after field 'tidInBlock'h reads( n562t | h r e a dtsi)d,( ttiidd)I,n Bnltohcrke(atdhsr(enatdhIrdexa.dxs)),, gtrioduIpn(Bglroocukp()t,h r e| a ^~~~~~~~~~~d Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElemen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ t().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ educe, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx940. 27 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 27 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for host. 27 warnings generated when compiling for gfx1030. 27 warnings generated when compiling for gfx1102. 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx941. 27 warnings generated when compiling for gfx900. 27 warnings generated when compiling for gfx803. 27 warnings generated when compiling for gfx1100. 27 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid)In file included from , nthreads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp(:n1t: hIn file included from r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.he:a10d: sIn file included from )/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h,: 167t: i/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:I562n:B15l:o cwarning: kinitializer order does not match the declaration order [-Wreorder-ctor]( threadIdx.x), group(group), | 562 ^~~~~~~~~~~~~~~~~ | tid(tid), nthreads(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:t562h:r60e:a dnote: sfield 'group' will be initialized after field 'stepSize') , tidInBlock(t h562r | e a d I dtxi.dx()t,i dg)r,o unpt(hgrreoaudps)(,n t h| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~e a d| s tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) , tidI n563B | l o c k (sttherpeSaidzIed(xn.cxc)l,S hgmreomu.pc(ogmrmo.ubpu)f,f S i| z ^~~~~~~~~~~e s[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ izes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lgo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ <1, 1>>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h note: field 'nthreads' will be initialized after field 'tidInBlock' :562: 15562: | warning: initializer order does not match the declaration order [-Wreorder-ctor] tid(tid), nthreads(nthrea d562s | ) , t itdiIdn(Btliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~~~~~~~( thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:a562d:I60d:x .note: xfield 'group' will be initialized after field 'stepSize') , gro u562p | ( g r o utpi)d,( t i| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , | n tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t hreads (563n | t h r e asdtse)p,S itzied(InncBclloSchkm(etmh.rceoamdmI.dbxu.fxf)S,i zgerso[uNpC(CgLr_oPuRpO)T,O _ S| I ^~~~~~~~~~~M PLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:: 562note: :in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] 595 | runTreeUpDo w562n | < T , RteiddO(pt,i dP)r,o tnotShirmepaldes<(1n,t h1r>e>a(dasr)g,s )t;i d I| n ^B lock(th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e202a:d53I:d xnote: .in instantiation of member function 'RunWorkElement, 0, 2>::run' requested herex ), gr o202u | p ( g r o u p ) ,R u n| W ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o r k| E tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)l ement< F563n | , T , sRteedpOSpi,z eA(lngcoc,l SPhrmoetmo.>c(o)m.mr.ubnu(fwfeS)i;z e s| [ ^N CCL_PROT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cppO:_12S:I1M:P Lnote: Ein instantiation of member function 'RunWork, 0, 2>::run' requested here] /NCC L12_ | SITMEPPLS_/CsOiLzLe_oFfU(NTC)()A l{l R e| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u c e| , group(group TREE, SIMPLE, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hM:a324x:,90 :d onote: uin instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereb le) | ^ 324 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391P:r95i:m inote: texpanded from macro 'IMPL_COLL_FUNC'i vesv,r e/d*oDpi*,/ 0N,C CPLr_oAtLoG,O _0#># aplrgiom,s N C| C ^L _PROTO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h_:#595#:p5r:o tnote: oin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here> ().r u595n | ( & n c crluSnhTmreeme.UwpoDrokw)n;< T\, R| e ^d Op, Pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:t562o:S15i:m pnote: lfield 'nthreads' will be initialized after field 'tidInBlock'e <1, 1> >562( | a r g s )t;i d (| t ^i d), nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e202a:d53s:( nnote: tin instantiation of member function 'RunWorkElement, 0, 2>::run' requested hereh read s202) | , t i d I n B lRoucnkW(otrhkrEelaedmIednxt.:(60):. rnote: ufield 'group' will be initialized after field 'stepSize'n (we); 562 | | ^ tid(tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp):,10 :n1t:h rnote: ein instantiation of member function 'RunWork, 0, 2>::run' requested herea ds(n t10h | rIeMaPdLs_)C,O LtLi_dFIUnNBCl(oAclkl(Rtehdruecaed,I dTxR.ExE),, SgIrMoPuLpE(,g rMoauxp,) ,h a l| f ^~~~~~~~~~~) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx940. 27 warnings generated when compiling for gfx803. 27 warnings generated when compiling for gfx908. 27 warnings generated when compiling for gfx941. 27 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for host. 27 warnings generated when compiling for gfx906. 27 warnings generated when compiling for gfx1102. 27 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uin/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ t32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPIn file included from LE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp,: 1M: iIn file included from n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 10u: iIn file included from n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.ht:8167_: t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h): 562 :| 15^: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 562 | 391 | t i dR(utniWdo)r,k ),, NgCrCoLu_pA(LgGrOo_u#p#)a,l g o| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ N C| C tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)L _PROTO_ #563# | p r o t os>t(e)p.Sriuzne((&nnccccllSShhmmeemm..cwoomrmk.)b;u f\f S i| z ^e s[NCCL_PROTO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:S562I:M15P:L Enote: ]field 'nthreads' will be initialized after field 'tidInBlock'/ NCCL_STE P562S | / s i z etoifd((Tt)i)d ){, n| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h r e| a group(groupd s(nthreads), tidInBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:d275I:d90x:. xnote: )in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, group(g r275o | u p ) , | P ^~~~~~~~~~~~~~~~~r imi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562v:e60s:< Tnote: ,field 'group' will be initialized after field 'stepSize' RedOp, 562F | a n A s ytmimde(ttriidc)<,N CnCtLh_rMeAaXd_sD(EnVt_hArReIaTdYs,) ,1 t>i,d I/n*BDliorcekc(tt=h*r/e0a,d IPdrxo.txo),, 0g>r opurpi(mgsr o u| p ^) , | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ A562L | G O _ # #taildg(ot,i dN)C,C Ln_tPhRrOeTaOd_s#(#nptrhorteoa>d(s)).,r utni(d&InncBclloSchkm(etmh.rweoardkI)d;x .\x ) ,| ^g roup(gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:p562):,15 : | note: ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~field 'nthreads' will be initialized after field 'tidInBlock' | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 562 | 563 | t i d (sttiedp)S,i znet(hnrcecaldSsh(mnetmh.rceoamdms.)b,u ftfiSdiIzneBsl[oNcCkC(Lt_hPrReOaTdOI_dSxI.MxP)L,E ]g/rNoCuCpL(_gSrToEuPpS)/,s i z| e ^~~~~~~~~~~~~~~~~o f(T/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):)562 :{60 : | note: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~field 'group' will be initialized after field 'stepSize' | group(group 562 | tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:d324):,90 :n tnote: hin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer eads(nth r324e | a d s ) , PtriidmIintBilvoecsk<(Tt,h rReeaddOIpd,x .Fxa)n,A sgyrmomuept(rgirco, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h 391: | 562 : 15R:u nwarning: Winitializer order does not match the declaration order [-Wreorder-ctor]o rke,a dNsC)C,L _tAiLdGIOn_B#l#oaclkg(ot,h rNeCaCdLI_dPxR.OxT)O,_ #g#rporuopt(og>r(o)u.pr)u,n ( &| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~c c l| S tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)h mem.wor k563) | ; \ s| t ^e pSize(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:c562c:l15S:h mnote: efield 'nthreads' will be initialized after field 'tidInBlock'm .comm. b562u | f f S i zteisd[(NtCiCdL)_,P RnOtThOr_eSaIdMsP(LnEt]h/rNeCaCdLs_)S,T EtPiSd/IsniBzleoocfk((Tt)h)r e{a d I| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~x . x| ) group(group, group(group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :| 324 ^~~~~~~~~~~~~~~~~: 90: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here562 :60: note: field 'group' will be initialized after field 'stepSize' 324 | 562 | P r i mtiitdi(vteisd<)T,, nRtehdrOepa,d sF(anntAhsryemamdest)r,i ct,, g/r*oDuipr(egcrto=u*p/)0,, P| r ^~~~~~~~~~~o to, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd(:t562i:d15):, warning: ninitializer order does not match the declaration order [-Wreorder-ctor]t hreads(nthrea d562s | ) , t itdiIdn(Btliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~~~~~~~( thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:a562d:I60d:x .note: xfield 'group' will be initialized after field 'stepSize') , grou p562( | g r o u pt)i,d ( t| i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d ) ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n thread s563( | n t h r esatdesp)S,i ztei(dnIcncBllSohcmke(mt.hcroemamd.Ibduxf.fxS)i,z egsr[oNuCpC(Lg_rPoRuOpT)O,_ S I| M ^~~~~~~~~~~P LE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :| 562 ^~~~~~~~~~~~~~~~~: 15:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :warning: 562initializer order does not match the declaration order [-Wreorder-ctor]: 60: note: field 'group' will be initialized after field 'stepSize' 562 | t i562d | ( t i d )t,i dn(tthirde)a,d sn(tnhtrheraedasd(sn)t,h rteiaddIsn)B,l otcikd(ItnhBrleoacdkI(dtxh.rxe)a,d Igdrxo.uxp)(,g rgoruopu)p,( g r| o ^~~~~~~~~~~u p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(w/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement(). r562u | n ( w e )t;i d (| t ^i d), nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cppe:a9d:s1(:n tnote: hin instantiation of member function 'RunWork, 0, 2>::run' requested herer eads )9, | ItMiPdLI_nCBOlLoLc_kF(UtNhCr(eAaldlIRdexd.uxc)e,, gTrRoEuEp,( gSrIoMuPpL)E,, M| i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n , | u tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)i nt64_t )563 | | ^ stepS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:z391e:(95n:c cnote: lexpanded from macro 'IMPL_COLL_FUNC'S hmem.com m391. | b u fRfuSniWzoersk[ , | N ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C C L| _ group(groupA LGO_##algo, NCCL_P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hR:O324T:O90_:# #note: pin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer oto>().r u324n | ( & n c c l SPhrmiemmi.twiovreks)<;T ,\ R e| d ^O p, Fan/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hA:s562y:m15m:e tnote: rfield 'nthreads' will be initialized after field 'tidInBlock'i c<1, N C562C | L _ M A Xt_iDdE(Vt_iAdR)I, nthTrYe>a,d s/(*nDtihrreecatd=s*)/,0 ,t iPdrIontBol,o c0k>( tphrriemasd I d| x ^. x), gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:u595p:(5g:r onote: uin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herep ), | 595 ^~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :r562u:n60T:r enote: efield 'group' will be initialized after field 'stepSize'U pDown< T562, | R e d Otpi,d (Ptriodt)o,S inmtphlreet>h(raeragdss));, t| i ^d InBloc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hk:(202t:h53r:e anote: din instantiation of member function 'RunWorkElement, 0, 2>::run' requested hereI dx.x )202, | g r o u p ( g rRouunpW)o,r k E| l ^~~~~~~~~~~e ment().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 : 15| : ^~~~~~~~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60: note: field 'group' will be initialized after field 'stepSize' 562 | 562t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atdisd)I,n BtliodcIkn(Btlhorceka(dtIhdrxe.axd)I,d xg.rxo)u,p (ggrroouupp()g,r o u| p ^~~~~~~~~~~) , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx908. 27 warnings generated when compiling for gfx941. 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 27 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for host. 27 warnings generated when compiling for gfx1102. 27 warnings generated when compiling for gfx906. 27 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gIn file included from r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cppo:u1p: (In file included from g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:o10u: pIn file included from )/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h,: 167 : | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ^~~~~~~~~~~: 562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().raun(we); | r ^g s); | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp ^: 4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:d202u:c53e:, note: Tin instantiation of member function 'RunWorkElement, 0, 2>::run' requested hereR EE, SIMPLE, P202r | e M u l S u m , RiunntW8o_rtk)E l e| m^e ntn(W)o.rrku, 0, 2>::run' requested here# #devr e4d | oIpML,L _NFCUCNLC_(AALlGlOR_e#d#uacleg,o ,T NRCECEL,_ PSRIOMTPOL_E#,# pPrroetMou>l(S)u.mr,u ni(n&tn8c_ctl)S h m| e^m .work);/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :\391 : 95| : ^ note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: 391note: | field 'nthreads' will be initialized after field 'tidInBlock' RunWo r562k | < n c c ltFiudn(ct#i#df)u,n cn,t htryepaed,s (Fnutnhcr#e#addesv)r,e dtoipdc,k (NtChCrLe_aAdLIGdOx_.#x#)a,l ggor,o uNpC(CgLr_oPuRpO)T,O _ #| # ^~~~~~~~~~~~~~~~~p rot/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:>562(:)60.:r unote: nfield 'group' will be initialized after field 'stepSize'( &ncclS h562m | e m . w otrikd)(;t i\d ) ,| ^n threads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562a:d15s:) ,note: field 'nthreads' will be initialized after field 'tidInBlock't idInBlock (562t | h r e a dtIiddx(.txi)d,) ,g rnotuhpr(egardosu(pn)t,h r e| a ^~~~~~~~~~~d s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hin instantiation of member function 'RunWorkElement, 0, 2>::run' requested here: 562:15 :202 | warning: initializer order does not match the declaration order [-Wreorder-ctor] RunWorkElement (n)t.hrruena(dwse()n;t h r| e ^a ds), tidI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cppn:B6l:o1c:k (note: tin instantiation of member function 'RunWork, 0, 2>::run' requested hereh readI d6x | .IxM)P,L _gCrOoLuLp_(FgUrNoCu(pA)l,l R e| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u c e| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) TREE, S563I | M P L E ,s tPerpeSMiuzleS(unmc,c liSnhtm3e2m_.tc)o m m| .^b uffSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:[391N:C95C:L _note: Pexpanded from macro 'IMPL_COLL_FUNC'R OTO_SIMP L391E | ] / NRCuCnLW_oSrTkE, NCCL_ALGO_##alg/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:,275 :N90C:C Lnote: _in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereP ROTO_## p275r | o t o > ( ) .Prruinm(i&tnicvcelsSd,( t/i*dD)i,r enctth=r*e/a0d,s (Pnrtohtroe,a d0s>) ,p rtiimdsI n B| l ^o ck(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:d595I:d5x:. xnote: )in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here, gro u595p | ( g r o urpu)n,T r e| e ^~~~~~~~~~~~~~~~~U pD/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:w562n:<60T:, note: Rfield 'group' will be initialized after field 'stepSize'e dOp, ProtoSimple<1, 1>>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562I:d15x:. xwarning: )initializer order does not match the declaration order [-Wreorder-ctor], group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ITY>, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:ds562):,15 :t iwarning: dinitializer order does not match the declaration order [-Wreorder-ctor]I nBlock(threadIdx .562x | ) , g rtoiudp((tgirdo)u,p )n,t h r| e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~a d s| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n thread s563) | , t i dsItneBplSoiczke((tnhcrcelaSdhImdexm..xc)o,m mg.rbouufpf(Sgirzoeusp[)N,C C L| _ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~P R O| T tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)O _SIMPL E563] | / N C C Ls_tSeTpESPiSz/es(inzcecolfS(hTm)e)m .{c o m| m ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~. b u| f group(groupf Sizes[NCCL_PROTO_SIMPLE]/NCCL_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hT:E275P:S90/:s inote: zin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heree of(T)) { 275 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heree tricT,, /R*eDdiOrpe,c tF=a*n/A0s,y mPmreottroi,c <0N>C CpLr_iMmAsX _ D| E ^V _ARITY,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :1595>:,5 :/ *note: Din instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herei rect= *595/ | 0 , P rroutnoT,r e0e>U ppDroiwmns< T ,| ^R edOp, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hP:r595o:t5o:S inote: min instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested herep le<1 ,595 | 1 > > ( arrugnsT)r;e e U| p ^D own, 0, 2>::run' requested hereo Simpl e202< | 1 , 1 > > ( a rRgusn)W;o r k| E ^l ement, 0, 2>::run' requested herep , Alg o202, | P r o t o > ( )R.urnuWno(rwkeE)l;e m e| n ^t , 0, 2>::run' requested herel go, P r9o | tIoM>P(L)_.CrOuLnL(_wFeU)N;C ( A| l ^l Reduce, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cppT:R7E:E1,: Snote: Iin instantiation of member function 'RunWork, 0, 2>::run' requested hereM PLE, P7r | eIMMuPlLS_uCmO,L Lu_iFnUtN6C4(_Atl)l R e| d^u ce, TR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hE:E391,: 95S:I Mnote: Pexpanded from macro 'IMPL_COLL_FUNC'L E, PreMu l391S | u m ,R uuniWnotr3k2<_ntc)c l F| u^n c##fun/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hc:,391 :t95y:p enote: ,expanded from macro 'IMPL_COLL_FUNC' Func##de v391r | e d oRpu<,n cNcClCFLu_nAcL#G#Of_u#n#ca,l gtoy,p eN,C CFLu_nPcR#O#TdOe_v#r#epdroopty(p)e.>r,u nN(C&CnLc_cAlLSGhOm_e#m#.awlogrok,) ;N C\C L _| P ^R OTO_##pro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:o562>:(15):. rnote: ufield 'nthreads' will be initialized after field 'tidInBlock'n (&nccl S562h | m e m . wtoirdk()t;i d\) , | n ^t hreads(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d snote: )field 'nthreads' will be initialized after field 'tidInBlock', tidIn B562l | o c k ( tthirde(atdiIdd)x,. xn)t,h rgeraodusp((ngtrhoruepa)d,s ) ,| ^~~~~~~~~~~~~~~~~t idI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:B562l:o60c:k (note: tfield 'group' will be initialized after field 'stepSize'h readId x562. | x ) , gtrid(tiodu)p,( gnrtohurpe)a,d s (| n ^~~~~~~~~~~~~~~~~t hre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562s:)60,: tnote: ifield 'group' will be initialized after field 'stepSize'd InBloc k562( | t h r e atdiIdd(xt.ixd)),, gnrtohurpe(agdrso(unpt)h,r e a| d ^~~~~~~~~~~s ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>()./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:u562n:(15&:n cwarning: cinitializer order does not match the declaration order [-Wreorder-ctor]l Shmem.work); \ | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :t562i:d15(:t inote: dfield 'nthreads' will be initialized after field 'tidInBlock') , nthr e562a | d s ( n tthirde(atdisd)),, tnitdhIrneBaldosc(kn(tthhrreeaaddsI)d,x .txi)d,I ngBrlooucpk((gtrhoruepa)d,I d x| . ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~x ) ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)g roup(g r563o | u p ) , s t| e ^~~~~~~~~~~~~~~~~p Siz/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:(562n:c60c:l Snote: hfield 'group' will be initialized after field 'stepSize'm em.com m562. | b u f f Stiizde(st[iNdC)C,L _nPtRhOrTeOa_dSsI(MnPtLhEr]e/aNdCsC)L,_ StTiEdPISn/Bsliozceko(ft(hTr)e)a d{I d x| . ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~x ) ,| group(groupg roup(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpD/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ own>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx941. 27 warnings generated when compiling for gfx90a. 27 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 27 warnings generated when compiling for gfx908. 27 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:275:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 275 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:324:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 324 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:595:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 595 | runTreeUpDown>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, TREE, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 27 warnings generated when compiling for host. 27 warnings generated when compiling for gfx1102. 27 warnings generated when compiling for gfx803. 27 warnings generated when compiling for gfx1100. 27 warnings generated when compiling for gfx1101. 27 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here In file included from 6/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp | :I1M: PIn file included from L/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h_:C10O: LIn file included from L/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h_:F169U: N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hC:(509A:l29l:R ewarning: dfield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor]u ce, RING, LL128, P507r | e M u l Stuimd,( tuiidn)t,8 _ntt)h r e| a^d s(nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:a391d:s95):, note: wexpanded from macro 'IMPL_COLL_FUNC'i d(tid%WA R391P | _ S IRZuEn)W,o rk | , N C CwLa_rApLIGnOB_l#o#cakl(gtoh,r eNaCdCILd_xP.RxO/TWOA_R#P#_pSrIoZtEo)>,( ) .| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u n (| & warp(tid/WARP_SIZEn cclSh m509e | m . w o rfkl)a;g T\h r e| a ^d ((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:986:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 986 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(AllReduce, RING, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t daIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ ta1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx942. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1,In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cppf:l1a: gIn file included from 1/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 10d: aIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.ha:2169,: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hf:l271a:g192:; warning: unused variable 'ptr' [-Wunused-variable]| ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 271 | 153 | u i nuti3n2t_6t4 _dta*t ap1t,r f=l arge1c,v Pdtart(a02),+ lfll1a2g82O;f f s| e ^~~~~t ; /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h :| 153 ^~~: 28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :563562 | : 15 : warning: sinitializer order does not match the declaration order [-Wreorder-ctor]t epSize(ncclShmem.co m562m | . b u f ftSiidz(etsi[dN)C,C Ln_tPhRrOeTaOd_sS(InMtPhLrEe]a/dNsC)C,L _tSiTdEIPnSB/lsoiczke(otfh(rTe)a)d I{d x .| x ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~) , | g group(groupr oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :56368 | : 56 : note: sin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested heret epSiz e68( | n c c l SPhrmiemmi.tciovmems.L,E ]0/,N CPCrLo_tSoT,E P0S>/ spirziemosf ( T| ) ^) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 588| : group(group5 : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:g68<:T56,: Rnote: ein instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested hered Op, P r68o | t o > ( aPrrgism)i;t i v| e ^s , 1, 2>::run' requested herey mmetr i202c | < 1 > , 0 , PRruontWoo,r k0E>l epmreinmts< F n| , ^ T, RedO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:,588 :A5l:g onote: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here Pro t588o | > ( ) . rruunn(Rwien)g;< T ,| ^R edOp, P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cppr:oto>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d Iwarning: dinitializer order does not match the declaration order [-Wreorder-ctor]x .x), group(group), 562| | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :588562 | : 15 : warning: rinitializer order does not match the declaration order [-Wreorder-ctor]u nRingt(iadr(gtsi)d;) , | n ^t hreads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:n202t:h53r:e anote: din instantiation of member function 'RunWorkElement, 1, 2>::run' requested heres ), ti d202I | n B l o c k ( t hRruenaWdoIrdkxE.lxe)m,e ngtr563( | ) . r u ns(tweep)S;i z e| ( ^n cclShmem.c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cppo:m12m:.1b:uffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 7 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreadIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cppIn file included from :/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp4::11: :In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hnote: :in instantiation of member function 'RunWork, 1, 2>::run' requested here10 : In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h: 1674: | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:M562P:L15_:C Owarning: Linitializer order does not match the declaration order [-Wreorder-ctor]L _FUNC(AllReduce, RING ,562 | S I M P LtEi,d (Mtaixd,) ,i nntth8r_eta)d s (| n^t hreads), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:i391d:I95n:B lnote: oexpanded from macro 'IMPL_COLL_FUNC'c k(thread I391d | x . xR)u,n Wgorrokul,S hNmCeCmL._cAoLmGmO._b#u#faflSgioz,e sN[CNCCLC_LP_RPORTOOT_O#_#SpIrMoPtLoE>](/)N.CrCuLn_(S&TnEcPcSl/Sshimzeemo.fw(oTr)k)) ;{ \ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| ^ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h562: | 68 : 56 : tnote: idin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here( tid), 68n | t h r e aPdrsi(mnitthirveeasdx,) ,0 ,g rPoruopt(og,r o0u>p )p,r i m| s ^~~~~~~~~~~~~~~~~ | ^/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588 :5625 | : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here tid (588t | i d ) , rnutnhRrienagdI(naBrlgosc)k;( t h| r ^e adIdx.x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h):,202 :g53r:o unote: pin instantiation of member function 'RunWorkElement, 1, 2>::run' requested here( group )202, | | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:d562(:t15i:d )warning: ,initializer order does not match the declaration order [-Wreorder-ctor] nthreads(nthreads), 562t | i d I n Btliodc(kt(itdh)r,e andtIhdrxe.axd)s,( ngtrhoruepa(dgsr)o,u pt)i,d I n| B ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~l o c| k tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)( threadI d563x | . x ) , sgtreopuSpi(zger(onucpc)l,S h m| e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~m . c| o tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)m m.buffS i563z | e s [ N CsCtLe_pPSRiOzTeO(_nScIcMlPSLhEm]e/mN.CcCoLm_mS.TbEuPfSf/Ssiizzeeso[fN(CTC)L)_ P{R O T| O ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~_ S I| M group(groupP LE]/NCCL_STEPS/sizeof/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(:T68):)56 :{ note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 68 | Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested hereF anSym m68e | t r i c i,m i0t,i vPersod Oppr,i mFsa n S| ^y mmetri/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hc:<5881:>5,: 0note: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here Prot o588, | 0 > prruinmRsi n g| < ^T , RedO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:,588 :P5r:o tnote: oin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here> (ar g588s | ) ; | r ^u nRing, 1, 2>::run' requested hereP roto> (202a | r g s ) ; | ^R unWor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hk:E202l:e53m:e nnote: tin instantiation of member function 'RunWorkElement, 1, 2>::run' requested here< Fn, T202, | R e d O p , ARlugnoW,o rPkrEoltoe>m(e)n.trin instantiation of member function 'RunWork, 1, 2>::run' requested here( ).run (8w | eI)M;P L _| C ^O LL_FUNC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp(:A7l:l1R:e dnote: uin instantiation of member function 'RunWork, 1, 2>::run' requested herec e, R I7N | GI,M PSLI_MCPOLLEL,_ FMUaNxC,( AilnltR6e4d_utc)e , | R^I NG, SI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hM:P391L:E95,: Mnote: aexpanded from macro 'IMPL_COLL_FUNC'x , uint32 _391t | ) R| u^n Workc,, NtCyCpLe_,A LFGuOn_c####adlegvor,e dNoCpCT,O _N#C#CpLr_oAtLoG>O(_)#.#raulng(o&,n cNcClCSLh_mPeRmO.TwOo_r#k#)p;r o\t o >| ( ^) .run(&/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:c562c:l15S:h mnote: efield 'nthreads' will be initialized after field 'tidInBlock'm .work) ;562 | \ | ^t id(tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 :n15t:h rnote: efield 'nthreads' will be initialized after field 'tidInBlock'a 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h 562 | : 562 : 15 :t iwarning: dinitializer order does not match the declaration order [-Wreorder-ctor]( tid), nthreads(nthreads), tid I562n | B l oc k (ttihdr(etaiddI)d,x .nxt)h,r egardosu(pn(tghrroeuapd)s,) , | t ^~~~~~~~~~~i dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:M562P:L15E:, warning: Minitializer order does not match the declaration order [-Wreorder-ctor]a x, half) | ^ 562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h | : 391 : 95 :t inote: dexpanded from macro 'IMPL_COLL_FUNC'( tid), nth r391e | a d sR(unntWhorreka,, N| C ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C L _| A tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)L GO_##a l563g | o , N CsCtLe_pPSRiOzTeO(_n#c#cplrSohtmoe>m(.)c.ormumn.(b&unfcfcSliSzhemse[mN.CwCoLr_kP)R;O T\O _ S| I ^M PLE]/NCCL_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hT:E562P:S15/:s inote: zfield 'nthreads' will be initialized after field 'tidInBlock'e of(T)) { 562 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | t group(groupi d(tid), nthreads(nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:d68s:)56,: tnote: iin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested hered InBlo c68k | ( t h r ePardiImdixt.ixv)e,s ,note: field 'group' will be initialized after field 'stepSize'0 , Prot o562, | 0 > ptriidm(st i d| ) ^, nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:d588s:(5n:t hnote: rin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested heree ads) ,588 | t i d I nrBulnoRcikn(gtu(pa(rggrso)u;p ) ,| ^ | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.htid), n:t562h:r15e:a dwarning: sinitializer order does not match the declaration order [-Wreorder-ctor]( nthreads), tidInBlock(thread I562d | x . x ) ,t igdr(otuipd()g,r onutph)r,e a d| s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( n t| h tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r eads), tidInBlock( t563h | r e a d Isdtxe.pxS)i,z eg(rnocucpl(Sghrmoeump.)c,o m m| . ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~b u f| f tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S izes[N C563C | L _ P R OsTtOe_pSSIiMzPeL(En]c/cNlCSChLm_eSmT.EcPoSm/ms.ibzuefoffS(iTze)s)[ N{C C L| _ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~P R O| T group(groupO _SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 68| : group(group56 : note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:i68v:e56s:< Tnote: ,in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here RedOp ,68 | F a n S yPmrmiemtirtiicv<,T ,0 ,R ePdrOopt,o ,F a0n>S ypmrmiemtsr i c| < ^1 >,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :0588,: 5P:r onote: tin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested hereo , 0> 588p | r i m s r u| n ^R ing, ProtoSimple<2, 2>>' requested hereP rot o588> | ( a r g sr)u;n R i| n ^g in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here( args) ;202 | | ^ Run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hW:o202r:k53E:l enote: min instantiation of member function 'RunWorkElement, 1, 2>::run' requested heree nt<(F)n.,r uTn,( wRee)d;O p ,| ^A lgo, Prot/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cppo:>12(:)1.:r unote: nin instantiation of member function 'RunWork, 1, 2>::run' requested here( we); 12 | | I ^M PL_COLL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cppF:U12N:C1(:A lnote: lin instantiation of member function 'RunWork, 1, 2>::run' requested hereR educ e12, | IRMIPNLG_,C OSLILM_PFLUEN,C (MAalxl,R eddouucbel,e )R I N| G^, SIMPLE,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :M391a:x95,: dnote: oexpanded from macro 'IMPL_COLL_FUNC'u ble) | ^ 391 | Ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:W391o:r95k:< nnote: cexpanded from macro 'IMPL_COLL_FUNC'c lFunc##f u391n | c , RtuynpWeo,r kFe,, NFCuCnLc_#A#LdGeOv_r#e#daolpgC,L _NPCRCOLT_OA_L#G#Op_r#o#taol>g(o),. rNuCnC(L&_nPcRcOlTSOh_m#e#mp.rwootrok>)(;) .\r u n| ( ^& ncclShmem.w/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:r562k:)15;: \note: field 'nthreads' will be initialized after field 'tidInBlock' | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562t:i15d:( tnote: ifield 'nthreads' will be initialized after field 'tidInBlock'd ), nth r562e | a d s ( nttihdr(etaidds)),, ntthirdeIandBsl(onctkh(rtehardesa)d,I dtxi.dxI)n,B lgorcoku(pth(rgeraoduIpd)x,. x )| , ^~~~~~~~~~~~~~~~~ gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:p562(:g60r:o unote: pfield 'group' will be initialized after field 'stepSize') , | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h562: | 562 : 60 : tnote: ifield 'group' will be initialized after field 'stepSize'd (tid) ,562 | n t h r etaidds((tnitdh)r,e andtsh)r,e atdisd(InntBhlroecakd(st)h,r etaiddIIdnxB.lxo)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ^~~~~~~~~~~o up(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidI 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tidIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx908. 13 warnings generated when compiling for gfx941. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 13 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 13 warnings generated when compiling for gfx940. 13 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx906. 13 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 13 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for host. 13 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from 562 | tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cppt:id1): , In file included from n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:h10r: eIn file included from a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hd:s167(: nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hh:r562e:a15d:s )warning: ,initializer order does not match the declaration order [-Wreorder-ctor] tidInBlock(threadIdx.x), group(grou p562) | , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t i d| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t id), nt h563r | e a d s (snttehprSeiazdes()n,c ctliSdhImneBml.occokm(mt.hbruefafdSIidzxe.sx[)N,C CgLr_oPuRpO(TgOr_oSuIpM)P,L E ]| / ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~N C C| L tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)_ STEPS /563s | i z e o fs(tTe)p)S i{z e (| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c c l| S group(grouph mem.comm.buffSizes[NCCL_PROTO_SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hP:L68E:]56/:N Cnote: Cin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested hereL _STEP S68/ | s i z e oPfr(iTm)i)t i{v e s| < ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~T , | R group(groupe dOp, FanSymmetric<1>, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :note: 588in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here: 5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 68 | 588 | P r i mriutniRviensg<m(eatrrgisc)<;1 > ,| ^0 , Proto,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :0202>: 53p:r inote: min instantiation of member function 'RunWorkElement, 1, 2>::run' requested heres | ^ 202 | Ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:W588o:r5k:E lnote: ein instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested herem ent <588F | n , T ,r uRneRdiOnpg,< TA,l gRoe,d OPpr,o tPor>o(t)o.>r(uanr(gwse));; | | ^ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::4202::153:: note: note: in instantiation of member function 'RunWork, 1, 2>::run' requested herein instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 4202 | | I M P L _ C O L LR_uFnUWNoCr(kAEllleRmeednutc (| )^. run(w/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:)391;: 95 :| ^note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp: 4391: | 1 : Rnote: uin instantiation of member function 'RunWork, 1, 2>::run' requested heren Work <4n | cIcMlPFLu_nCcO#L#Lf_uFnUcN,C (tAylpleR,e dFuucnec,# #RdIeNvGr,e dSoIpMM,i nN,C CiLn_tA8L_GtO)_ # #| a^l go, NC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:L391_:P95R:O Tnote: Oexpanded from macro 'IMPL_COLL_FUNC'_ ##proto> (391) | . r uRnu(n&Wnocrckl , N CtCiLd_(AtLiGdO)_,# #natlhgroe,a dNsC(CnLt_hPrReOaTdOs_)#,# ptriodtIon>B(l)o.crku(nt(h&rnecacdlISdhxm.exm).,w ogrrko)u;p (\g r o| u ^p ), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::1560:: note: note: field 'nthreads' will be initialized after field 'tidInBlock'field 'group' will be initialized after field 'stepSize' 562562 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tn(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork15,: Nwarning: Cinitializer order does not match the declaration order [-Wreorder-ctor]C L_ALGO_##algo, NCCL_PROTO_ #562# | p r o t ot>i(d)(.triudn)(,& nnctchlrSehamdesm(.nwtohrrke)a;d s\) , | t ^i dInBlock(threadIdx.x), gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:u562p:(15g:r onote: ufield 'nthreads' will be initialized after field 'tidInBlock'p ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 562 | 563 | t i ds(tteipdS)i,z en(tnhcrcelaSdhsm(enmt.hcroemamd.sb)u,f ftSiidzIensB[lNoCcCkL(_tPhRrOeTaOd_ISdIxM.PxL)E,] /gNrCoCuLp_(SgTrEoPuSp/)s,i z| e ^~~~~~~~~~~~~~~~~o f(T/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):)562 :{60 : | note: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~field 'group' will be initialized after field 'stepSize' | group(group 562 | tid(tid), nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:e68a:d56s:) ,note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested heret idInBl o68c | k ( t h rPeraidmIidtxi.vxe)s,< gTr,o uRpe(dgOrpo,u pF)a,n S y| m ^~~~~~~~~~~m etric<1>, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclSh/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid ),562 | n t h r etaidds((tnitdh)r,e andtsh)r,e atdisd(InntBhlroecakd(st)h,r etaiddIIdnxB.lxo)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ^~~~~~~~~~~o up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h | ^~~~~~~~~~~ :562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 17 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##al g562o | , N C CtLi_dP(RtOiTdO)_,# #nptrhorteoa>d(s)(.nrtuhnr(e&andcsc)l,S htmiedmI.nwBolrokc)k;( t\h r e| a ^d Idx.x), group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:g562r:o15u:p )note: ,field 'nthreads' will be initialized after field 'tidInBlock' | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 562 | 563t | i d ( t isdt)e,p Snitzher(enacdcsl(Snhtmherme.acdosm)m,. btuifdfISniBzleosc[kN(CtChLr_ePaRdOITdOx_.SxI)M,P LgEr]o/uNpC(CgLr_oSuTpE)P,S / s| i ^~~~~~~~~~~~~~~~~z eof/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:T562):)60 :{ note: field 'group' will be initialized after field 'stepSize'| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 562 | tid(tid), nthreads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(:n68t:h56r:e anote: din instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested heres ), ti d68I | n B l o cPkr(itmhirteiavdeIsd, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing17< warningTs, generated when compiling for Rgfx1102e. dOp, Proto>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:68:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 68 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:588:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 588 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ : warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, dat/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ a2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] d-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 655 : 11t:i dnote: (in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret id), nt h655r | e a d s ( n t h r e apdrsi)m,s (ttiiddI-ntBildoSctka(rtthRreedaudcIed,x .nxT)h,r egardosuRpe(dgurcoeu,p )n,u l l| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t r ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)& direct -563> | o u t , satregpsS-i>zsee(nndcbculfSfh,m eamr.gcso-m>mr.ebcuvfbfuSfifz,e s [| N ^C CL_PROTO_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hS:I202M:P53L:E ]note: /in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereN CCL_S T202E | P S / s i z e o fR(uTn)W)o r{k E l| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~m e n| t group(group< Fn, T, RedOp, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hA:l641g:o11,: Pnote: rin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereo to>().ru n641( | w e ) ; | ^ prims/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp(:t4i:d1-:t inote: din instantiation of member function 'RunWork, 2, 2>::run' requested hereS tartR e4d | uIcMeP,L _nCTOhLrLe_aFdUsNRCe(dAulcleR,e dduicree,c tC-O>LdLoNwEnT,_ D&IdRiErCeTc,t -S>IoMuPtL,E ,a rSgusm-P>ossetnDdibvu,f fi,n ta8r_gts)- > r| e^c vbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 391 ^: 95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: 391note: | in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here RunW o202r | k < n c c l F u nRcu#n#WfournkcE,l etmyepnet,< FFnu,n cT#,# dReevdrOepd,o pAP,r oNtCoC>L(_)A.LrGuOn_(#w#ea)l;g o ,| ^N CCL_PROTO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp_:#4#:p1r:o tnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested here> ().ru n4( | &InMcPcLl_SChOmLeLm_.FwUoNrCk()A;l l\R e d| u ^c e, COLLNET/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:D562I:R15E:C Tnote: ,field 'nthreads' will be initialized after field 'tidInBlock' SIMPLE ,562 | S u m P otsitdD(itvi,d )i,n tn8t_htr)e a d| s^( nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d391s:)95,: tnote: iexpanded from macro 'IMPL_COLL_FUNC'd InBlock( t391h | r e aRduIndWxo.rxk)<,n cgcrloFuupn(cg#r#ofuupn)c,, t| y ^~~~~~~~~~~~~~~~~p e, F/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:n562c:#60#:d enote: vfield 'group' will be initialized after field 'stepSize'r edop , NtCiCdL(_tAiLdG)O,_ #n#tahlrgeoa,d sN(CnCtLh_rPeRaOdTsO)_,# #tpirdoItnoB>l(o)c.kr(utnh(r&enacdcIldSxh.mxe)m,. wgorroku)p;( g\r o u| p), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562s:(15n:t hwarning: rinitializer order does not match the declaration order [-Wreorder-ctor]e ads), tidInBloc k562( | t h r e atdiIdd(xt.ixd)),, gnrtohurpe(agdrso(unpt)h,r e a| d ^~~~~~~~~~~~~~~~~s ), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:I60n:B lnote: ofield 'group' will be initialized after field 'stepSize'c k(thr e562a | d I d x .txi)d,( tgirdo)u,p (ngtrhoruepa)d,s ( n| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d s), ti d563I | n B l o cskt(etphSriezaed(Indcxc.lxS)h,m egmr.ocuopm(mg.rbouufpf), | ^~~~~~~~~~~ Sizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:t562h:r15e:a dwarning: Iinitializer order does not match the declaration order [-Wreorder-ctor]d x.x), group(grou p562) | , | ^~~~~~~~~~~t id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/size/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ of(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->rec/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hv:b562u:f15f:, warning: initializer order does not match the declaration order [-Wreorder-ctor]| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: 562in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here | t i202d | ( t i d ) , n tRhurneWaodrsk(Enltehmreenatd)(,) .grruonu(pw(eg)r;o u p| ) ^, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T): 5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here563 | s5t | eIpMSPiLz_eC(OnLcLc_lFSUhNmCe(mA.lcloRmemd.ubcuef,f SCiOzLeLsN[ENTC_CDLI_RPERCOTT,O _SSIIMMPPLLEE,] /SNuCmCPLo_sStTDEiPvS,/ suiizneto8f_(tT)) ) | {^ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h group(group: 391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hu:n655W:o11r:k , FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herec clFunc# #655f | u n c , t y p e , pFruinmcs#(#tdiedv-rteiddoSptd,u cNeC,C Ln_TAhLrGeOa_d#s#Raeldguoc,e ,N CnCuLl_lPpRtOrT,O _&#d#iprreoctto->>(o)u.tr,u na(r&gnsc-c>lsSehnmdebmu.fwfo,r ka)r;g s\- > r| e ^c vbuff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562 :| 15 ^: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h: 202562: | 53 : note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heret id(t i202d | ) , n t h r e aRdusn(WnotrhkrEelaedmse)n,t r(o)u.pr(ugnr(owuep));, | | ^ ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp :note: 5field 'group' will be initialized after field 'stepSize': 1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 5 | tIiMdP(Lt_iCdO)L,L _nFtUhNrCe(aAdlsl(Rnetdhurceea,d sC)O,L LtNiEdTI_nDBIlRoEcCkT(,t hSrIeMaPdLIEd,x .Sxu)m,P ogsrtoDuipv(,g ruoiunpt)8,_ t )| ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h, :g562r:o15u:p (warning: ginitializer order does not match the declaration order [-Wreorder-ctor]r oup), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562 :56260 | : note: field 'group' will be initialized after field 'stepSize' tid(ti d562) | , n t htrieda(dtsi(dn)t,h rnetahdrse)a,d st(indtIhnrBelaodcsk)(,t htriedaIdnIBdlxo.cxk)(,t hgrreoaudpI(dgxr.oxu)p,) ,g r o| u ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~p ( g| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)o up), | 563 ^~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvb/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:ff562,: 15 :| ^warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here562 | t202i | d ( t i d ) , nRtuhnrWeoardksE(lnetmhernetax()),. rgurno(uwpe()g;r o u| p ^) , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T): 5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 563 | 5s | tIeMpPSLi_zCeO(LnLc_cFlUSNhCm(eAml.lcRoemdmu.cbeu,f fCSOiLzLeNsE[TN_CDCILR_EPCRTO,T OS_ISMIPMLPEL,E ]S/uNmCPCoLs_tSDTiEvP,S /usiinzte8o_ft()T ) )| ^{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : group(group391 :95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h: 677391: | 11 : Rnote: uin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heren WorkT,h rNeCaCdLs_BAcLaGsOt_,# #&adligroe,c tN-C>CoLu_tP,R OdTiOr_e#c#tp-r>odtoow>n(,) .arrugns(-&>nscecnldSbhumfefm,. waorrgks)-;> r\e c v| b ^u ff, | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ^: 562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53 :562 | note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here tid (202t | i d ) , n t h rReuandWso(rnktEhlreemaednst)<,F nt,i dTI,n BRleodcOkp(,t hArlegaod,I dPxr.oxt)o,> (g)r.oruupn((gwreo)u;p ) ,| ^ | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp::605:: 1note: :field 'group' will be initialized after field 'stepSize' note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 5 | I MtPiLd_(CtOiLdL)_,F UnNtCh(rAelaldRse(dnutcher,e aCdOsL)L,N EtTi_dDIInRBElCoTc,k (StIhMrPeLaEd,I dSxu.mxP)o,s tgDriovu,p (ugirnotu8p_)t,) | | ^~~~~~~~~~~^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunW/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::391562::9515:: note: warning: expanded from macro 'IMPL_COLL_FUNC'initializer order does not match the declaration order [-Wreorder-ctor] 391 | RunWo r562k | < n c c ltFiudn(ct#i#df)u,n cn,t htryepaed,s (Fnutnhcr#e#addesv)r,e dtoipdc,k (NtChCrLe_aAdLIGdOx_.#x#)a,l ggor,o uNpC(CgLr_oPuRpO)T,O _ #| # ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~p r o| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)o >().ru n563( | & n c c lsSthempeSmi.zweo(rnkc)c;l S\h m e| m ^. comm.b/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:f562f:S15i:z enote: sfield 'nthreads' will be initialized after field 'tidInBlock'[ NCCL_P R562O | T O _ S ItMiPdL(Et]i/dN)C,C Ln_tShTrEePaSd/ss(inztehorfe(aTd)s)) ,{ t i| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~I n B| l group(groupo ck(threadIdx.x), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hg:r641o:u11p:( gnote: rin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereo up), | ^~~~~~~~~~~~~~~~~ 641 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 60 : note: field 'group' will be initialized after field 'stepSize' prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:o562c:k15(:t hwarning: rinitializer order does not match the declaration order [-Wreorder-ctor]e adIdx.x), group(grou p562) | , | ^~~~~~~~~~~~~~~~~t id(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:)60,: nnote: tfield 'group' will be initialized after field 'stepSize'h reads( n562t | h r e a dtsi)d,( ttiidd)I,n Bnltohcrke(atdhsr(enatdhIrdexa.dxs)),, gtrioduIpn(Bglroocukp()t,h r e| a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d I d| x tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T). x), gr o563u | p ( group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ er, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:(15t:i dwarning: )initializer order does not match the declaration order [-Wreorder-ctor], nthreads(nthreads), 562t | i d I n Btliodc(kt(itdh)r,e anthreads(ndtIhdrxe.axd)s,) ,g rtoiudpI(ngBrlooucpk)(,t h r| e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~a d I| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)x .x), g r563o | u p ( g rsotuepp)S,i z e| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n c c| l tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S hmem.c o563m | m . b u fsftSeipzSeisz[eN(CnCcLc_lPSRhOmTeOm_.ScIoMmPmL.Eb]u/fNfCSCiLz_eSsT[ENPCSC/Ls_iPzReOoTfO(_TS)I)M P{L E ]| / ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~N C C| L group(group_ STEPS/sizeof(T)) {/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 677| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~11 : | note: group(groupin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:m641s:(11t:i dnote: -in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret idStartB c641a | s t , n T h r e a dpsrBicmass(tt,i d&-dtiirdeSctta-r>toRuetd,u cdei,r encTth-r>edaodwsnR,e daurcges,- >dsiernedcbtu-f>fd,o wanr,g s&-d>irreeccvtb-u>fofu,t , | a ^r gs->send/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hb:u202f:f53,: anote: rin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereg s->re c202v | b u f f , | ^R unWorkE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hl:e202m:e53n:t , 2, 2>::run' requested heren , T, 202R | e d O p , A l gRou,n WPorroktEol>e(m)e.nrtu, 2, 2>::run' requested here> ().ru n8( | wIeM)P;L _ C| O ^L L_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:,562 : 15| : ^ warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 562 | 202 | t i d ( t iRdu)n,W onrtkhErleeamdesn(tnd(I)d.xr.uxn)(,w e); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALG/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hO:_562#:#15a:l gwarning: oinitializer order does not match the declaration order [-Wreorder-ctor], NCCL_PROTO_##pr o562t | o > ( ) .triudn((t&indc)c,l Snhtmherme.awdosr(kn)t;h r\e a d| s ^) , tidI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:B562l:o15c:k (note: tfield 'nthreads' will be initialized after field 'tidInBlock'h readId x562. | x ) , gtriodu(pt(igdr)o,u pn)t,h r e| a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d s (| n tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t hreads )563, | t i d IsntBelpoScikz(et(hnrcecaldSIhdmxe.mx.)c,o mgmr.obuupf(fgSriozueps)[,N C C| L ^~~~~~~~~~~~~~~~~_ PR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hO:T562O:_60S:I Mnote: Pfield 'group' will be initialized after field 'stepSize'L E]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:,562 : 15| : ^ warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | 562 | t i dR(utniWdo)r,k Enltehmreenatdr(e)a.drIudnx(.wxe)),; g r| o ^u p(group),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp : 8| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~1 : | note: tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)in instantiation of member function 'RunWork, 2, 2>::run' requested here 5638 | | I M P Ls_tCeOpLSLi_zFeU(NnCc(cAllSlhRmeedmu.cceo,m mC.ObLuLfNfESTi_zDeIsR[ENCCTC,L _SPIRMOPTLOE_,S ISMuPmLPEo]s/tNDCiCvL,_ SiTnEtP6S4/_sti)z e o| f^( T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h): 391{: 95 :| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~note: expanded from macro 'IMPL_COLL_FUNC' | group(group 391 | RunWork, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, type, F626u | n c # # d e v r epdroipm-,t iNdCSCtLa_rAtLSGcOa_t#t#earl,g on,T hNrCeCaLd_sPSRcOaTtOt_e#r#,p rNoUtLoL>,( )d.irruenc(t&-n>cucpl,S hamregms.-w>osrekn)d;b u\f f ,| ^a rgs->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562c:v15b:u fnote: ffield 'nthreads' will be initialized after field 'tidInBlock', | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :t202i:d53(:t inote: din instantiation of member function 'RunWorkElement, 2, 2>::run' requested here) , nth r202e | a d s ( n t h r eRaudnsW)o,r ktEildeImneBnltou(p)).,r u n| ( ^~~~~~~~~~~~~~~~~w e)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h;: 562 :| 60 ^: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp: 8562: | 1 : note: in instantiation of member function 'RunWork, 2, 2>::run' requested heret id(ti d8) | ,I MnPtLh_rCeOaLdLs_(FnUtNhCr(eAaldlsR)e,d utcied,I nCBOlLoLcNkE(Tt_hDrIeRaEdCITd,x .SxI)M,P LgEr,o uSpu(mgProosutpD)i,v , | i ^~~~~~~~~~~n t64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:n562W:o15r:k , FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncclFunc##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hO:_562S:I15M:P Lwarning: Einitializer order does not match the declaration order [-Wreorder-ctor]] /NCCL_STEPS/sizeo f562( | T ) ) {t i d| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t i d| ) group(group, nthreads(nthreads), tidInBloc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hk:(666t:h9r:e anote: din instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereI dx.x), 666g | r o u p ( g r o uppr)i,m s (| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~i d ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n Thread s563G | a t h e rs,t edpiSriezcet(-n>cucpl,S hNmUeLmL.,c oamrmg.sb-u>fsfeSnidzbeusf[fN,C CaLr_gPsR-O>TrOe_cSvIbMuPfLfE,] / N| C ^C L_STEPS/si/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hz:e202o:f53(:T )note: )in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 202 | | group(group RunWorkEleme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:t687<:F11n:, note: Tin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, RedOp, A687l | g o , P r o t o > (p)r.irmusn((twied)-;t i d| S ^t artBcast/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp,: 9n:T1h:r enote: ain instantiation of member function 'RunWork, 2, 2>::run' requested hered sBcas t9, | I&MdPiLr_eCcOtL-L>_oFuUtN,C (nAullllRpetdru,c ea,r gCsO-L>LsNeEnT_dDbIuRfEfC,T ,a rSgIsM-P>LrEe,c vSbuumfPfo,s t D| i ^v , uint64/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h_:t202): 53 :| ^note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202391 | : 95 : note: expanded from macro 'IMPL_COLL_FUNC' RunWor k391E | l e mReunntWF(u)n.cr#u#nd(ewver)e;d o p| < ^t ype>, NCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp_:A8L:G1O:_ #note: #in instantiation of member function 'RunWork, 2, 2>::run' requested herea lgo, N8C | CILM_PPLR_OCTOOL_L#_#FpUrNoCt(oA>l(l)R.erduunc(e&,n cCcOlLSLhNmEeTm_.DwIoRrEk); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hB:l562o:c15k:( twarning: hinitializer order does not match the declaration order [-Wreorder-ctor]r eadIdx.x), group( g562r | o u p ) ,t i d| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t i d| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), nthre a563d | s ( n t hsrteeapdSsi)z,e (tnicdcIlnSBhlmoecmk.(ctohmrme.abduIfdfxS.ixz)e,s [gNrCoCuLp_(PgRrOoTuOp_)S,I M P| L ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~E ] /| N tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)C CL_STE P563S | / s i z esotfe(pTS)i)z e{( n c| c ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l S h| m group(groupe m.comm.buffSizes[NCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h_:P626R:O9T:O _note: Sin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereI MPLE]/N C626C | L _ S T E P S / spirziemosf((tTi)d)-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , T, RedOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 43 warnings generated when compiling for gfx908. 43 warnings generated when compiling for gfx940. 43 warnings generated when compiling for gfx90a. 43 warnings generated when compiling for gfx90a. 43 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 43 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 43 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 43 warnings generated when compiling for host. 43 warnings generated when compiling for gfx906. 43 warnings generated when compiling for gfx1100. 43 warnings generated when compiling for gfx1101. 43 warnings generated when compiling for gfx1102. 43 warnings generated when compiling for gfx1030. 43 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h : 386 : 9 :u iwarning: nvariable 'wireOffset' set but not used [-Wunused-but-set-variable]t 64_t* ptr =386 | r e c v Pitnrt( 0w)i+rlelO1f2f8sOeftf s=e tW;i r e| W ^~~o rdPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hx:.562x:)15,: gwarning: rinitializer order does not match the declaration order [-Wreorder-ctor]o up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 562 | 563 | t i d ( tsitde)p,S inzteh(rnecacdlsS(hnmtehmr.ecaodmsm).,b utfifdSIinzBelso[cNkC(CtLh_rPeRaOdTIOd_xS.IxM)P,L Eg]r/oNuCpC(Lg_rSoTuEpP)S,/ s i| z ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~e o f| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)T )) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~563 | | group(group stepSize(ncclShm/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.he:m626.:c9o:m mnote: .in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereb uffSize s626[ | N C C L _ P R O TpOr_iSmIsM(PtLiEd]-/tNiCdCSLt_aSrTtESPcSa/tstiezre,o fn(TTh)r)e a{d s S| c ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a t t| e group(groupr , NULL, direct->up, a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:g641s:-11>:s enote: nin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here dbuff, a r641g | s - > r e c v b u f fp,r i m| s ^( tid-ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:S202t:a53r:t Rnote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested hered uce, n202T | h r e a d s R e dRuucneW,o rdkiErleecmte-n>td oAultg,o ,a rPgrso-t>os>e(n)d.bruufnf(,w ea)r;g s -| > ^r ecvbuff,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp : 5| : ^1 : note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :5202 | :I53M:P Lnote: _in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereC OLL_F U202N | C ( A l l R e d uRcuen,W oCrOkLELlNeEmTe_nDtI)( ) .| r^u n(we)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h;: 391 :| 95 ^: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp :3915 | : 1 :R unote: nin instantiation of member function 'RunWork, 2, 2>::run' requested hereW orkC,T ,N CSCILM_PALLEG,O _S#u#ma,l guoi,n tN8CC_Lt_)P R O| T^O _##pro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:o391>:(95):. rnote: uexpanded from macro 'IMPL_COLL_FUNC'n (&ncclSh m391e | m . wRournkW)o;r k\< n c| c ^l Func#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h#:fu562n:c15,: tnote: yfield 'nthreads' will be initialized after field 'tidInBlock'p e, Fun c562# | # d e v rteiddo(ptn,t hNrCeCaLd_sA(LnGtOh_r#e#aadlsg)o,, tNiCdCILn_BPlRoOcTkO(_t#h#rperaodtIod>x(.)x.)r,u ng(r&onucpc(lgSrhomuepm).,w o r| k ^~~~~~~~~~~~~~~~~) ; \/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562| ^: 60: note: field 'group' will be initialized after field 'stepSize'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:15: note: 562field 'nthreads' will be initialized after field 'tidInBlock' | ti d562( | t i d ) ,t indt(htrieda)d,s (nntthhrreeaaddss()n,t htriedaIdnsB)l,o ctki(dtIhnrBelaodcIkd(xt.hxr)e,a dgIrdoxu.px()g,r ogurp)o,u p (| g ^~~~~~~~~~~r oup), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h-:>562o:u15t:, warning: ninitializer order does not match the declaration order [-Wreorder-ctor]u llptr, args->send b562u | f f , atrigds(-t>irde)c,v bnutfhfr,e a d| s ^( nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:)202,: 53t:i dnote: Iin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren Block (202t | h r e a d I d x .Rxu)n,W ogrrkoEulpe(mgernotue(p)S.irzuen((nwcec)l;S h m| e ^m .comm.b/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppu:f4f:S1i:z enote: sin instantiation of member function 'RunWork, 2, 2>::run' requested here[ NCCL_ P4R | OITMOP_LS_ICMOPLLLE_]F/UNNCCC(LA_lSlTREePdSu/csei,z eCoOfL(LTN)E)T _{D I R| E ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C T ,| group(groupS IMPLE, Sum, int8_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:)626 : 9| :^ note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95 :626 | note: expanded from macro 'IMPL_COLL_FUNC' pr i391m | s ( tRiudn-WtoirdkS-,> uNpC,C La_rAgLsG-O>_s#e#nadlbguof,f ,N CaCrLg_sP-R>OrTeOc_v#b#upfrfo,t o >| ( ^) .run(&n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hc:c202l:S53h:m enote: min instantiation of member function 'RunWorkElement, 2, 2>::run' requested here. work) ;202 | \ | ^ Ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:W562o:r15k:E lnote: efield 'nthreads' will be initialized after field 'tidInBlock'm ents(()n.trhurne(awdes));, t| i ^d InBlock(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppt:h5r:e1a:d Inote: din instantiation of member function 'RunWork, 2, 2>::run' requested herex .x), g5r | oIuMpP(Lg_rCoOuLpL)_,F U N| C ^~~~~~~~~~~~~~~~~( All/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hR:e562d:u60c:e ,note: field 'group' will be initialized after field 'stepSize'C OLLNET _562D | I R E C Tt,i dS(ItMiPdL)E,, nStuhmr,e audisn(tn8t_htr)e a d| s^) , tidIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hB:l391o:c95k:(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid( tid), note: nexpanded from macro 'IMPL_COLL_FUNC't hreads(nthreads), t i391d | I n BRluoncWko(rtkh, NCC L562_ | A L G O _t#i#da(ltgiod,) ,N CnCtLh_rPeRaOdTsO(_n#t#hprreoatdos>)(,) .triudnI(n&BnlcocclkS(htmherme.awdoIrdkx).;x )\, g| r ^o up(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hUL:L562,: 15a:r gwarning: sinitializer order does not match the declaration order [-Wreorder-ctor]- >sendbuff, args->rec v562b | u f f , t i| d ^( tid), n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:h202r:e53a:d snote: (in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren threa d202s | ) , t i d I n BRluoncWko(rtkhErleeamdeIndtx<.Fxn),, Tg,r oRuepd(Ogpr,o uApl)g,o , | P ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r o t| o tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)> ().ru n563( | w e ) ; s t| e ^p Size(nc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppc:l5S:h1m:e mnote: .in instantiation of member function 'RunWork, 2, 2>::run' requested herec omm.b u5f | fISMiPzLe_sC[ONLCLC_LF_UPNRCO(TAOl_lSRIeMdPuLcEe],/ NCCOCLLL_NSETTE_PDSI/RsEiCzT,e oSfI(MTP)L)E ,{ S u| m ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, u| i group(groupn t8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:: 626note: :expanded from macro 'IMPL_COLL_FUNC'9 : note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 391 | R626u | n W o r k < n c cplrFiumnsc(##tfiudn-ct,i dtSytpaer,t SFcuantct#e#rd,e vnrTehdroepat,t eNrC,C LN_UALLLG,O _d#i#raelcgto-,> uNpC,C La_rPgRsO-T>Os_e#n#dpbruoftfo,> (a)r.grsu-n>(r&enccvcbluSfhfm,e m .| w ^o rk); \ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 202 ^: 53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15 :202 | note: field 'nthreads' will be initialized after field 'tidInBlock' R562u | n W o r ktEilde(mteindt)<,F nn,t hTr,e aRdesd(Onpt,h rAelagdos,) ,P rtoitdoI>n(B)l.orcukn((twher)e;a d I| d ^x .x), gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppu:p5(:g1r:o unote: pin instantiation of member function 'RunWork, 2, 2>::run' requested here) , | ^~~~~~~~~~~~~~~~~ 5 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:M562P:L60_:C Onote: Lfield 'group' will be initialized after field 'stepSize'L _FUNC( A562l | l R e d utcied,( tCiOdL)L,N EnTt_hDrIeRaEdCsT(,n tShIrMePaLdEs,) ,S utmi,d IuniBnlto8c_kt()t h r| e^a dIdx.x)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 391g:r95o:u p(note: gexpanded from macro 'IMPL_COLL_FUNC'r oup), | ^~~~~~~~~~~391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tIn file included from id/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp(:t1i: dIn file included from )/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 10n: tIn file included from h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hr:e167a: d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:(562n:t15h:r ewarning: ainitializer order does not match the declaration order [-Wreorder-ctor]d s), tidInBlock(t h562readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:M562P:L15E:] /warning: Ninitializer order does not match the declaration order [-Wreorder-ctor]C CL_STEPS/sizeof(T)) {562 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ t| i group(groupd (tid), nthreads(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hh:r666e:a9d:s )note: ,in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here tidInB l666o | c k ( t h r e a dpIrdixm.sx()t,i dg,r onuTph(rgeraoduspG)a,t h e| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, d| i tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r ect->u p563, | N U L Ls,t eaprSgisz-e>(snecncdlbSuhfmfe,m .acrogmsm-.>bruefcfvSbiuzfefs,[ N C| C ^L _PROTO_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hI:M202P:L53E:] /note: Nin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereC CL_ST E202P | S / s izeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h.:x562):,15 :g rwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]u p(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ^~~~~~~~~~~: 562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.wor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :t15i:d (warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d), nthreads(n t562h | r e a d st)i,d (ttiiddI)n,B lnotchkr(etahdrse(andtIhdrxe.axd)s,) ,g rtoiudpI(ngBrlooucpk)(,t h r| e ^~~~~~~~~~~~~~~~~a dId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hx:.562x:)60,: gnote: rfield 'group' will be initialized after field 'stepSize'o up(gro u562p | ) , | t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~i d (| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)i d), nth r563e | a d s ( nsttherpeSaidzse)(,n ctcildSIhnmBelmo.ccko(mtmh.rbeuafdfISdixz.exs)[,N CgCrLo_uPpR(OgTrOo_uSpI)M,P L E| ] ^~~~~~~~~~~/ NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, dire/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:S562h:m15e:m .warning: winitializer order does not match the declaration order [-Wreorder-ctor]o rk); \ | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :t562i:d15(:t inote: dfield 'nthreads' will be initialized after field 'tidInBlock') , nthrea d562s | ( n t h rteiadd(st)i,d )t,i dnItnhBrleoacdks((tnhtrheraedaIddsx).,x )t,i dgIrnoBulpo(cgkr(otuhpr)e,a d I| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~x . x| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), group (563g | r o u p )s,t e p| S ^~~~~~~~~~~~~~~~~i ze(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:c562c:l60S:h mnote: efield 'group' will be initialized after field 'stepSize'm .comm. b562u | f f S i zteisd[(NtCiCdL)_,P RnOtThOr_eSaIdMsP(LnEt]h/rNeCaCdLs_)S,T EtPiSd/IsniBzleoocfk((Tt)h)r e{a d I| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~x . x| ) group(group, group(group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :| 641 ^~~~~~~~~~~: 11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS//usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hsi:z562e:o15f:( Twarning: )initializer order does not match the declaration order [-Wreorder-ctor]) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 562 | tid(tid)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 666n:t9h:r enote: ain instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hered s(nthr e666a | d s ) , t i d IpnrBilmosc(kt(itdh,r enaTdhIrdexa.dxs)G,a tghreoru,p (dgirroeucpt)-,> u p| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ N U| L tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)L , args -563> | s e n d bsutfefp,S iazreg(sn-c>crleSchvmbeumf.fc,o m m| . ^b uffSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:[202N:C53C:L _note: Pin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereR OTO_S I202M | P L E ] / N C C LR_uSnTWEoPrSk/Esliezmeeonft(:(687):.11r:u nnote: (in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herew e); | ^ 687 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp : 5 : 1 : pnote: rin instantiation of member function 'RunWork, 2, 2>::run' requested herei ms(ti d5- | tIiMdPSLt_aCrOtLBLc_aFsUtN,C (nATlhlrReeadduscBec,a sCtO,L L&NdEiTr_eDcItR-E>CoTu,t ,S InMuPlLlEp,t rS,u ma,r gusi-n>ts8e_ntd)b u f| f^, args/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h-:>391r:e95c:v bnote: uexpanded from macro 'IMPL_COLL_FUNC'f f, | ^ 391 | Ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:W202o:r53k:< nnote: cin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herec lFunc #202# | f u n c , t y pReu,n WFournkcE#l#edmeevnrtee,d ONpC,C LA_lAgLoG,O _P#r#oatlog>o(,) .NrCuCnL(_wPeR)O;T O _| # ^# proto>(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp):.6r:u1n:( ¬e: nin instantiation of member function 'RunWork, 2, 2>::run' requested herec clShm e6m | .IwMoPrLk_)C;O L\L _ F| U ^N C(AllRe/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:u562c:e15,: Cnote: Ofield 'nthreads' will be initialized after field 'tidInBlock'L LNET_D I562R | E C T , tSiIdM(PtLiEd,) ,S unmt,h rienatd3s2(_ntt)h r e| a^d s), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:d391I:n95B:l onote: cexpanded from macro 'IMPL_COLL_FUNC'k (threadI d391x | . x )R,u ngWroorukp<(ngcrcoluFpu)n,c # #| f ^~~~~~~~~~~~~~~~~u nc,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :t562y:p60e:, note: Ffield 'group' will be initialized after field 'stepSize'u nc##de v562r | e d o p i,d )N,C CnLt_hArLeGaOd_s#(#natlhgroe,a dNsC)C,L _tPiRdOITnOB_l#o#cpkr(otthor>e(a)d.Irduxn.(x&)n,c cglrSohumpe(mg.rwoourpk)),; \| ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hock(thr:e562a:d15I:d xwarning: .initializer order does not match the declaration order [-Wreorder-ctor]x ), group(group), | 562 ^~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :t562i:d60(:t inote: dfield 'group' will be initialized after field 'stepSize') , nthr e562a | d s ( n tthirde(atdisd)),, tnitdhIrneBaldosc(kn(tthhrreeaaddsI)d,x .txi)d,I ngBrlooucpk((gtrhoruepa)d,I d x| . ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~x ) ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)g roup(g r563o | u p ) , s t| e ^~~~~~~~~~~p Size(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hlock:(562t:h15r:e awarning: dinitializer order does not match the declaration order [-Wreorder-ctor]I dx.x), group(grou p562), | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ t i| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)( tid), n t563h | r e a d ss(tnetphSriezaed(sn)c,c ltSihdmIenmB.lcoocmkm(.tbhurfefaSdiIzdexs.[xN)C,C Lg_rPoRuOpT(Og_rSoIuMpP)L,E ] /| N ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C C L| _ tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S TEPS/s i563z | e o f ( Ts)t)e p{S i z| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( n c| c group(groupl Shmem.comm.buff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hS:i687z:e11s:[ Nnote: Cin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC L_PROTO _687S | I M P L E ] / N C C Lp_rSiTmEsP(St/isdi-zteiodfS(tTa)r)t B{c a s| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, n| T group(grouph readsBcast, &dire/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hc:t655-:>11o:u tnote: ,in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here nullptr ,655 | a r g s - > s e n d bpurfifm,s (atrigds--t>irdeSctvabrutfRfe,d u c| e ^, nThrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:s202R:e53d:u cnote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, null p202t | r , & d i r e cRtu-n>Woourtk,E laermgesn-t>lrgeoc,v bPurfoft,o > (| ) ^. run(we)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h;: 202 :| 53 ^: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp: 5202: | 1 : note: in instantiation of member function 'RunWork, 2, 2>::run' requested here Ru n5W | oIrMkPELl_eCmOeLnLt_R(E)C.Tr,u nS(IwMeP)L;E , | S ^u m, uint/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp8:_7t:)1 : | note: ^in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :7391 | :I95M:P Lnote: _expanded from macro 'IMPL_COLL_FUNC'C OLL_FUN C391( | A l lRRuendWuocrek,< nCcOcLlLFNuEnTc_#D#IfRuEnCcT,, tSyIpMeP,L EF,u nScu#m#,d euvirnetd3o2p_^, NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hA:L391G:O95_:# #note: aexpanded from macro 'IMPL_COLL_FUNC'l go, NCC L391_ | P R ORTuOn_W#o#rpkrl(F)u.nrcu#n#(f&unnccc,l Sthympeem,. wFournkc)#;# d\e v r| e ^d op:,15 :N Cnote: Cfield 'nthreads' will be initialized after field 'tidInBlock'L _ALGO_ #562# | a l g o ,t iNdC(CtLi_dP)R,O TnOt_h#r#epardost(on>t(h)r.eraudns()&,n ctcildSIhnmBelmo.cwko(rtkh)r;e a\d I d| x ^. x), gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:u562p:(15g:r onote: ufield 'nthreads' will be initialized after field 'tidInBlock'p ), | ^~~~~~~~~~~~~~~~~ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :t60i:d (note: tfield 'group' will be initialized after field 'stepSize'i d), nt h562r | e a d s (tnitdh(rteiadd)s,) ,n tthirdeIandBsl(onctkh(rtehardesa)d,I dtxi.dxI)n,B lgorcoku(pt(hgrreoaudpI)d,x . x| ) ^~~~~~~~~~~~~~~~~, gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:u562p:(60g:r onote: ufield 'group' will be initialized after field 'stepSize'p ), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:p562):,15 : | warning: ^~~~~~~~~~~initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562562 | : 15 : warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d(tid), nthreads( n562t | h r e a dtsi)d,( ttiidd)I,n Bnltohcrke(atdhsr(enatdhIrdexa.dxs)),, gtrioduIpn(Bglroocukp()t,h r e| a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d I d| x tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T). x), g563r | o u p ( gsrtoeuppS)i,z e (| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~c c l| S tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)h mem.co m563m | . b u f fsStiezpeSsi[zNeC(CnLc_cPlRSOhTmOe_mS.IcMoPmLmE.]b/uNfCfCSLi_zSeTsE[PNSC/CsLi_zPeRoOfT(OT_)S)I M{P L E| ] ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/ N C| C group(groupL _STEPS/sizeof(T)) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h{: 655 | : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~11 : | note: group(groupin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 641 :p11r:i mnote: sin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here( tid-tidS t641a | r t R e d u c e , npTrhirmesa(dtsiRde-dtuicdeS,t anrutlRlepdturc,e ,& dniTrherceta-d>soRuetd,u caer,g sd-i>rseecntd-b>udfofw,n ,a r&gdsi-r>ercetc-v>bouuftf,, a r| g ^s ->sendbuf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hf:,202 :a53r:g snote: -in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here> recvb u202f | f , | ^ RunWo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:k202E:l53e:m enote: nin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heret e(n)t.note: (in instantiation of member function 'RunWork, 2, 2>::run' requested here) .run( w7e | )I;M P L| _ ^C OLL_FUN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppC:(7A:l1l:R enote: din instantiation of member function 'RunWork, 2, 2>::run' requested hereu ce, C O7L | LINMEPTL__DCIORLELC_TF,U NSCI(MAPlLlER,e dSuucme,, uCiOnLtL3N2E_Tt_)D I R| E^C T, SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hP:L391E:,95 :S unote: mexpanded from macro 'IMPL_COLL_FUNC', uint32_ t391) | | R^u nWorkn,c ,N CtCyLp_eA,L GFOu_n#c##a#ldgeov,r eNdCoCpL<_tPyRpOeT>O,_ #N#CpCrLo_tAoL>G(O)_.#r#uanl(g&on,c cNlCSChLm_ePmR.OwToOr_k#)#;p r\o t o| > ^( ).run(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:&562n:c15c:l Snote: hfield 'nthreads' will be initialized after field 'tidInBlock'm em.wor k562) | ; \ t| i ^d (tid),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :n562t:h15r:e anote: dfield 'nthreads' will be initialized after field 'tidInBlock's (nthre a562d | s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xn.txh)r,e agdrso)u,p (tgirdoIunpB)l,o c k| ( ^~~~~~~~~~~~~~~~~t hre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562I:d60x:. xnote: )field 'group' will be initialized after field 'stepSize', group (562g | r o u p )t,i d (| t ^~~~~~~~~~~~~~~~~i d),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :n562t:h60r:e anote: dfield 'group' will be initialized after field 'stepSize's (nthre a562d | s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xn.txh)reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , group(group), | ^~~~~~~~~~~ buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562| : ^15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 562 | 202 | t i d ( t i dR)u,n WnotrhkrEelaedmse(nnttI(d)x..rxu)n,( wger)o;u p (| g ^r oup), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~6 : 1| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 563 | 6 | I M PsLt_eCpOSLiLz_eF(UnNcCc(lASlhlmReemd.uccoem,m .CbOuLfLfNSEiTz_eDsI[RNECCCTL,_ PSRIOMTPOL_ES,I MSPuLmE,] /iNnCtC3L2__StT)E P S| /^s izeof/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:T391):)95 :{ note: expanded from macro 'IMPL_COLL_FUNC'| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 391 | RunWor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hk:<687n:c11c:l Fnote: uin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heren c##func ,687 | t y p e , F u n c #p#rdiemvsr(etdiodp-a,r tNBCcCaLs_tA,L GnOT_h#r#eaaldgsoB,c aNsCtC,L _&PdRiOrTeOc_t#-#>poruott,o >n(u)l.lrputnr(,& nacrcglsS-h>mseemn.dwbourfkf),; a\r g s| - ^> recvb/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:f562f:,15 : | note: ^field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :562202 | : 53 : note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herei d(tid )202, | n t h r e a d sR(unntWhorrekaEdlse)m,e nttiu(p)(.grruonu(pw)e,) ; | ^~~~~~~~~~~~~~~~~| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppfield 'group' will be initialized after field 'stepSize': 5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here562 | t5i | dI(MtPiLd_)C,O LnLt_hFrUeNaCd(sA(lnltRherdeuacdes,) ,C OtLiLdNIEnTB_lDoIcRkE(CtTh,r eSaIdMIPdLxE.,x )S,u mg,r ouuipn(tg8r_otu)p ) ,| ^ | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) p), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h562::56215::15 :warning: initializer order does not match the declaration order [-Wreorder-ctor]warning: initializer order does not match the declaration order [-Wreorder-ctor] 562562 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | 563 | s tsetpeSpiSziez(en(cncclcSlhSmhemme.mc.ocmomm.mb.ubfuffSfiSziezse[sN[CNCCLC_LP_RPORTOOT_OS_ISMIPMLPEL]E/]N/CNCCLC_LS_TSETPESP/Ss/isziezoefo(fT()T)) ){ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group| group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::641655::1111:: note: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herein instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641655 | | pprriimmss((ttiidd--ttiiddSSttaarrttRReedduuccee,, nnTThhrreeaaddssRReedduuccee,, dniurlelcptt-r>,d o&wdni,r e&cdti-r>eocutt-,> oaurtg,s -a>rsgesn-d>bsuefnfd,b uafrfg,s -a>rrgesc-v>bruefcfv,b u f| f ^, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h53::202 :note: 53in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | 202 | R u n WRournkWEolrekmEelnetmo(t)o.>r(u)n.(rwuen)(;w e )| ; ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp1::7 :note: 1in instantiation of member function 'RunWork, 2, 2>::run' requested here: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | I M7P | LI_MCPOLL_LC_OFLULN_CF(UANlCl(RAeldluRceed,u cCeO,L LCNOELTL_NDEITR_EDCITR,E CSTI,M PSLIEM,P LSEu,m ,S uimn,t 3u2i_ntt)3 2 _| t^) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h95::391 :note: 95expanded from macro 'IMPL_COLL_FUNC': note: expanded from macro 'IMPL_COLL_FUNC' 391 | 391R | u n WRournkWy,p eN>C,C LN_CACLLG_OA_L#G#Oa_l#g#oa,l gNoC,C LN_CPCRLO_TPOR_O#T#Op_r#o#tpor>o(t)o.>r(u)n.(r&unnc(c&lnSchcmleSmh.mweomr.kw)o;r k\) ; | \ ^ | ^/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:15:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :note: 562field 'nthreads' will be initialized after field 'tidInBlock': 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | 562t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atdisd)I,n BtliodcIkn(Btlhorceka(dtIhdrxe.axd)I,d xg.rxo)u,p (ggrroouupp()g,r o u| p ^~~~~~~~~~~~~~~~~) , /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^~~~~~~~~~~~~~~~~562 :60:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :note: 562field 'group' will be initialized after field 'stepSize': 60: note: field 'group' will be initialized after field 'stepSize' 562 | 562ti | d ( t i dt)i,d (nttihdr)e,a dnst(hnrtehardesa(dnst)h,r etaiddsI)n,B ltoicdkI(ntBhlroecakd(Itdhxr.exa)d,I dgxr.oxu)p,( ggrroouupp)(,g r o| u ^~~~~~~~~~~p ), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork ,warning: initializer order does not match the declaration order [-Wreorder-ctor]N CCL_ALGO_##algo, NC C562L | _ P R O TtOi_d#(#tpirdo)t,o >n(t)h.rreuand(s&(nnctchlrSehamdesm).,w otrikd)I;n B\l o c| k ^( thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:d562x:.15x:) ,note: field 'nthreads' will be initialized after field 'tidInBlock'g roup(g r562o | u p ) , t i| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( t i| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) , nthr e563a | d s ( n tshtreepaSdisz)e,( ntcicdlISnhBmleomc.kc(otmhmr.ebaudfIfdSxi.zxe)s,[ NgCrCoLu_pP(RgOrToOu_pS)I,M P L| E ^~~~~~~~~~~~~~~~~] /NC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:L562_:S60T:E Pnote: Sfield 'group' will be initialized after field 'stepSize'/ sizeof (562T | ) ) { t i| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( t i| d group(group) , nthreads(nthreads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 687t:i11d:I nnote: Bin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herel ock(thr e687a | d I d x . x ) , g rporuipm(sg(rtoiudp-)t,i d S| t ^~~~~~~~~~~a rtBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h, Sum, i:n562t:3152:_ twarning: )initializer order does not match the declaration order [-Wreorder-ctor] | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 562 | 391t | i d (RtuindW)o,r kn,, gNrCoCuLp_(AgLrGoOu_p#)#,a l g| o ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, N| C tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)C L_PROT O563_ | # # p r osttoe>p(S)i.zreu(nn(c&cnlcSchlmSehmm.ecmo.mwmo.rbku)f;f S\i z e| s ^[ NCCL_P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hR:O562T:O15_:S Inote: Mfield 'nthreads' will be initialized after field 'tidInBlock'P LE]/NC C562L | _ S T E PtSi/ds(itziedo)f,( Tn)t)h r{e a d| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( n t| h group(groupr eads), tidInBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:d687I:d11x:. xnote: )in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, group(g r687o | u p ) , | ^~~~~~~~~~~~~~~~~ p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:i562m:s60(:t inote: dfield 'group' will be initialized after field 'stepSize'- tidSta r562t | B c a s tt,i dn(Tthirde)a,d snBtcharseta,d s&(dnitrherceta-d>so)u,t ,t induIlnlBpltorc,k (atrhgrse-a>dsIednxd.bxu)f,f ,g raorugps(-g>rroeucpv)b,u f f| , ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:O562L:L15N:E Twarning: _initializer order does not match the declaration order [-Wreorder-ctor]D IRECT, SIMPLE, Sum ,562 | i n t 6 4t_itd)( t id| )^, nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d391s:(95n:t hnote: rexpanded from macro 'IMPL_COLL_FUNC'e ads), ti d391I | n B lRoucnkW(otrhkr , NsCtCeLp_SAiLzGeO(_n#c#callSghom,e mN.CcCoLm_mP.RbOuTfOf_S#i#zperso[tNoC>C(L)_.PrRuOnT(O&_nScIcMlPSLhEm]e/mN.CwCoLr_kS)T;E P\S / s| i ^z eof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h): 562{: 15 :| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~note: field 'nthreads' will be initialized after field 'tidInBlock' | group(group 562 | tid(tid),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :n655t:h11r:e anote: din instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heres (nthrea d655s | ) , t i d I n B l opcrki(mtsh(rteiadd-Itdixd.Sxt)a,r tgRreoduupc(eg,r onuTph)r,e a d| s ^~~~~~~~~~~~~~~~~R edu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:e562,: 60n:u lnote: lfield 'group' will be initialized after field 'stepSize'p tr, &d i562r | e c t - >toiudt(,t iadr)g,s -n>tshernedabdusf(fn,t harregasd-s>)r,e ctvibduIfnfB,l o c| k ^( threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:x202.:x53):, note: gin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herer oup(g r202o | u p ) , | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unc, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:391::56295::15 :note: expanded from macro 'IMPL_COLL_FUNC'warning: initializer order does not match the declaration order [-Wreorder-ctor] 391 | RunWorkn,B lNoCcCkL(_tAhLrGeOa_d#I#daxl.gxo),, NgCrCoLu_pP(RgOrToOu_p#)#,p r o| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t o >| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) .run(&n c563c | l S h m esmt.ewpoSrikz)e;( n\c c l| S ^h mem.co/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hm:m562.:b15u:f fnote: Sfield 'nthreads' will be initialized after field 'tidInBlock'i zes[NC C562L | _ P R O TtOi_dS(ItMiPdL)E,] /nNtChCrLe_aSdTsE(PnSt/hsriezaedosf)(,T )t)i d{I n B| l ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~o c k| ( group(groupt hreadIdx.x), group(gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:u666p:)9,: note: | in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562 :66660 | : note: field 'group' will be initialized after field 'stepSize' pr i562m | s ( t i dt,i dn(Tthirdea)d,s Gnatthhreera,d sd(inrtehcrte-a>dusp),, NtUiLdLI,n Balrogcsk-(>tshernedabduIfdfx,. xa)r,g sg-r>oruepc(vgbruofufp,) , | ^ | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:I15n:B lwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]c k(threadIdx.x) ,562 | g r o u pt(igdr(otuipd)),, n| t ^~~~~~~~~~~h reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 15p:r iwarning: minitializer order does not match the declaration order [-Wreorder-ctor]s (tid, nThreadsGathe r562, | d i r etcitd-(>tuipd,) ,N UnLtLh,r eaardgss(-n>tshernedabdusf)f,, tairdgIsn-B>lroecckv(btuhfrfe,a d I| d ^x .x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :g202r:o53u:p note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:g562r:o15u:p )warning: ,initializer order does not match the declaration order [-Wreorder-ctor] | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: 562field 'group' will be initialized after field 'stepSize' | ti d562( | t i d ) ,t indt(htrieda)d,s (nntthhrreeaaddss()n,t htriedaIdnsB)l,o ctki(dtIhnrBelaodcIkd(xt.hxr)e,a dgIrdoxu.px()g,r ogurpo)u,p ( g| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u p| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^~~~~~~~~~~~~~~~~562 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | ti d562( | t i d ) ,t indt(htrieda)d,s (nntthhrreeaaddss()n,t htriedaIdnsB)l,o ctki(dtIhnrBelaodcIkd(xt.hxr)e,a dgIrdoxu.px()g,r ogurpo)u,p ( g| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u p| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hN:C562C:L15_:A Lwarning: Ginitializer order does not match the declaration order [-Wreorder-ctor]O _##algo, NCCL_ P562R | O T O _ #t#ipdr(ottiod>)(,) .nrtuhnr(e&andcsc(lnSthhmreema.dws)o,r kt)id;I n\B l o| c ^k (thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:d562x:.15x:) ,note: field 'nthreads' will be initialized after field 'tidInBlock'g roup(g r562o | u p ) , t i| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( t i| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) , nthr e563ad | s ( n t hsrteeapdSsi)z,e (tnicdcIlnSBhlmoecmk.(ctohmrme.abduIfdfxS.ixz)e,s [gNrCoCuLp_(PgRrOoTuOp_)S,I M P| L ^~~~~~~~~~~~~~~~~E ]/N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:C562L:_60S:T Enote: Pfield 'group' will be initialized after field 'stepSize'S /sizeo f562( | T ) ) {t i d| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t i d| ) group(group, nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:e677a:d11s:) ,note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret idInBloc k677( | t h r e a d I d x . xp)r,i mgsr(otuipd(-gtrioduSpt)a,r t B| c ^~~~~~~~~~~a st, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:r562e:c15t:- >warning: uinitializer order does not match the declaration order [-Wreorder-ctor]p , args->sendbuff, 562a | r g s - >triedc(vtbiudf)f,, n t| h ^r eads(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:h202r:e53a:d snote: )in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, tidI n202B | l o c k ( t h r eRaudnIWdoxr.kxE)l,e mgernotu ( ) . rsutne(pwSei)z;e ( n| c ^c lShmem.c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppo:m7m:.1b:u fnote: fin instantiation of member function 'RunWork, 2, 2>::run' requested hereS izes[ N7C | CILMP_LP_RCOOTLOL__SFIUMNPCL(EA]l/lNRCeCdLu_ce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :687562 | : 15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] prims(tid- t562i | d S t a rttiBdc(atsitd,) ,n TnhtrheraedasdBsc(anstth,r e&addisr)e,c tt-i>doIuntB,l oncukl(ltphtrre,a daIrdgxs.-x>)s,e ngdrbouufpf(,g raorugps)-,> r e| c ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~v b u| f tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)f , | ^ 563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :s202t:e53p:S inote: zin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heree (nccl S202h | m e m . c o m m .RubnuWfofrSkiEzleesm[eNnCtC/(s)i.zreuonf((wTe))); { | ^| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :7687 | :I11M:P Lnote: _in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC OLL_FUN C687( | A l l R e d u c e , pCrOiLmLsN(EtTi_dD-ItRiEdCSTt,a rStIBMcPaLsEt,, SnuTmh,r euaidnstB3c2a_stt), &| d^i rect->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ho:u391t:,95 :n unote: expanded from macro 'IMPL_COLL_FUNC'l lptr, ar g391s | - > sReunndWbourfkf<,n cacrlgFsu-n>cr#e#cfvubnucf,f ,t y p| e ^, Func##/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:e202v:r53e:d onote: pin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here< type> ,202 | N C C L_ A L G O _R#u#naWlogrok,E lNeCmCeLn_tP,( )A.lrguon,( &PnrcoctloS>h(m)e.mr.uwno(rwke));; \ | ^| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::7562::115:: note: note: in instantiation of member function 'RunWork, 2, 2>::run' requested herefield 'nthreads' will be initialized after field 'tidInBlock' 7 | 562I | M P L _ CtOiLdL(_tFiUdN)C,( AnltlhRreedaudcse(,n tChOrLeLaNdEsT)_,D ItRiEdCITn,B lSoIcMkP(LtEh,r eSaudmI,d xu.ixn)t,3 2g_rto)u p (| g^r oup),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391| : ^~~~~~~~~~~~~~~~~95 : note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hexpanded from macro 'IMPL_COLL_FUNC': 562:60: note: field 'group' will be initialized after field 'stepSize' 391 | R u562n | W o r k h,r eNaCdCILd_xA.LxG)O,_ #g#raolugpo(,g rNoCuCpL)_,P R O| T ^~~~~~~~~~~O _##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h 563 | :s562t:e15p:S iwarning: zinitializer order does not match the declaration order [-Wreorder-ctor]e (ncclShmem.comm.buf f562S | i z e s [tNiCdC(Lt_iPdR)O,T On_tShIrMePaLdEs](/nNtChCrLe_aSdTsE)P,S /tsiidzIenoBfl(oTc)k)( t{h r e| a ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d I d| x group(group. x), group(g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:o687u:p11):, note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 687 | 563 | s t e ppSriizmes((ntcicdl-SthimdeSmt.acrotmBmc.absutf,f SniTzherse[aNdCsCBLc_aPsRtO,T O&_dSiIrMePcLtE-]>/oNuCtC,L _nSuTlElPpSt/rs,i zaerogfs(-T>)s)e n{d b u| f ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~f , | a group(groupr gs->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::677202::1153:: note: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herein instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | 677 | R u n WporrikmEsl(etmiedn-ttt(,) .&rduinr(ewcet)-;> o u| t ^, direc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppt:-8>:d1o:w nnote: ,in instantiation of member function 'RunWork, 2, 2>::run' requested here args- >8s | eInMdPbLu_fCfO,L La_rFgUsN-C>(rAelclvRbeudfufc,e , | C ^O LLNET_D/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hI:R202E:C53T:, note: Sin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereI MPLE, 202S | u m , i n t 6 4R_utn)W o r| k^E lemen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:<391F:n95,: Tnote: ,expanded from macro 'IMPL_COLL_FUNC' RedOp, A391l | g o ,R uPnrWootrok><(n)c.crluFnu(nwce#)#;f u n| c ^, type, F/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppu:n7c:#1#:d enote: vin instantiation of member function 'RunWork, 2, 2>::run' requested herer edop< t7y | pIeM>P,L _NCCOCLLL__AFLUGNOC_(#A#lallRgeod,u cNeC,C LC_OPLRLONTEOT__#D#IpRrEoCtTo,> (S)I.MrPuLnE(,& nScucml,S humienmt.3w2o_rtk)) ; | \^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h391::56295::15 :note: expanded from macro 'IMPL_COLL_FUNC'note: field 'nthreads' will be initialized after field 'tidInBlock' 391562 | | R u ntWiodr(kt(I,td ixNd.C)xC,)L ,_n AtgLhrGroOeu_ap#d(#sga(rlnogtuohp,r) e,Na Cd Cs| L) ^~~~~~~~~~~~~~~~~_, P Rt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hOi:Td562OI:_n60#B:#l ponote: rcfield 'group' will be initialized after field 'stepSize'ok t(ot>h( r)562e. | ar du In d( x&t.nixcd)c(,lt Sighdrm)oe,um p.n(wtgohrrrokeu)ap;d) s,\( n t| | h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^r e a| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ):,562 : t15563i: | d Inote: nfield 'nthreads' will be initialized after field 'tidInBlock' B lsotc ek562p( | St ih zr ee (atndicIdcd(lxtS.ihxdm))e,,m .gncrtoohmurmpe.(abgdursfo(funSpti)hz,re es a[| dN ^~~~~~~~~~~sC )C,L _tPiRdOITnOB_lSoIcMkP(LtEh]r/eNaCdCILd_xS.TxE)P,S /gsriozuepo(fg(rTo)u)p ){, | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ | group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60: note: field 'group' will be initialized after field 'stepSize' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 677t:i11d:( tnote: iin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hered ), nthr e677a | d s ( n t h r e a d sp)r,i mtsi(dtIindB-ltoicdkS(ttahrrteBacdaIsdtx,. xn)T,h rgeraoduspB(cgarsotu,p )&,d i r| e ^~~~~~~~~~~c t->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h#:al562g:o15,: Nwarning: Cinitializer order does not match the declaration order [-Wreorder-ctor]C L_PROTO_##proto>().r u562n | ( & n c ctliSdh(mteimd.)w,o rnkt)h;r e\a d s| ( ^n thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:)562,: 15t:i dnote: Ifield 'nthreads' will be initialized after field 'tidInBlock'n Block( t562h | r e a dtIiddx(.txi)d,) ,g rnotuhpr(egardosu(pn)t,h r e| a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d s )| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) tidInB l563o | c k ( t hsrteeapdSIidzxe.(xn)c,c lgSrhomuepm(.gcroomump.)b,u f f| S ^~~~~~~~~~~~~~~~~i zes/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h[:N562C:C60L:_ Pnote: Rfield 'group' will be initialized after field 'stepSize'O TO_SIM P562L | E ] / N CtCiLd_(StTiEdP)S,/ snitzheroefa(dTs)()n t{h r e| a ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ d s| ) group(group, tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:x641.:x11):, note: gin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer oup(gro u641p | ) , | ^~~~~~~~~~~ prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::15391:: 95warning: :initializer order does not match the declaration order [-Wreorder-ctor] note: expanded from macro 'IMPL_COLL_FUNC' 391 | 562R | u n W o rtkir,e aNdCICdLx_.AxL)G,O _g#r#oaulpg(og,r oNuCpC)L,_ P R| O ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~T O _| # tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)# proto> (563) | . r u n (s&tnecpcSliSzhem(enmc.cwloSrhkm)e;m .\c o m| m ^. buffSiz/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:s562[:N15C:C Lnote: _field 'nthreads' will be initialized after field 'tidInBlock'P ROTO_S I562M | P L E ] /tNiCdC(Lt_iSdT)E,P Sn/tshirzeeaodfs((Tn)t)h r{e a d| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~) , | t group(groupi dInBlock(threadId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hx:.641x:)11,: gnote: rin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereo up(grou p641) | , | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :p60r:i mnote: sfield 'group' will be initialized after field 'stepSize'( tid-ti d562S | t a r t Rteiddu(ctei,d )n,T hnrtehardesaRdesd(uncteh,r edaidrse)c,t -t>iddIonwBnl,o c&kd(itrherceta-d>Iodux.tx,) ,a rggrso-u>ps(egnrdobuupf)f,, a| r ^~~~~~~~~~~g s->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lgo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :p562r:i15m:s (warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d-tidStartScatter, n562T | h r e a dtsiSdc(attitde)r,, nNtUhLrLe,a ddsi(rnetchtr-e>audps,) ,a rtgisd-I>nsBelnodcbku(ftfh,r eaardgIsd-x>.rxec)v,b ugfrfo,u p (| g ^r oup), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 202 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: 53 :| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 563202 | | s t e p SRiuzneW(onrckcEllSehmmeenmt.S(I)M.PrLuEn](/wNeC)C;L _ S| T ^E PS/sizeo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppf:(7T:)1): {note: in instantiation of member function 'RunWork, 2, 2>::run' requested here | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group7 | IMPL_COLL_FUNC(AllRe/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:u687c:e11,: Cnote: Oin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereL LNET_DI R687E | C T , S I M P L E ,p rSiumms,( tuiidn-tt3i2d_Stt)a r t| B^c ast, n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hT:h391r:e95a:d snote: Bexpanded from macro 'IMPL_COLL_FUNC'c ast, &di r391e | c t -R>uonuWto,r kncs,e ntdybpuef,f ,F uanrcg#s#-d>ervercevdboupf ^, NCCL_A/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hL:G202O:_53#:# anote: lin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereg o, NC C202L | _ P R O T O _ # #RpurnoWtoor>k(E)l.ermuenn(t&()/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h.:r562u:n15(:w enote: )field 'nthreads' will be initialized after field 'tidInBlock'; | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp :t7i:d1(:t inote: din instantiation of member function 'RunWork, 2, 2>::run' requested here) , nth r7e | aIdMsP(Ln_tChOrLeLa_dFsU)N,C (tAildlIRneBdluoccek,( tChOrLeLaNdEITd_xD.IxR)E,C Tg,r oSuIpM(PgLrEo,u pS)u,m , | u ^~~~~~~~~~~~~~~~~i nt3/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h2:_562t:)60 : | note: ^field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :562391 | : 95 : note: texpanded from macro 'IMPL_COLL_FUNC'i d(tid), n391t | h r eRaudnsW(onrtkhp,) ,N C C| L ^~~~~~~~~~~_ ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::6015:: note: warning: field 'group' will be initialized after field 'stepSize'initializer order does not match the declaration order [-Wreorder-ctor] 562 | ti d562( | t i d ) ,t indt(htrieda)d,s (nntthhrreeaaddss()n,t htriedaIdnsB)l,o ctki(dtIhnrBelaodcIkd(xt.hxr)e,a dgIrdoxu.px()g,r ogurpo)u,p ( g| r ^~~~~~~~~~~o up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hdx:.562x:)15,: gwarning: rinitializer order does not match the declaration order [-Wreorder-ctor]o up(group), | ^~~~~~~~~~~~~~~~~ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :t60i:d (note: tfield 'group' will be initialized after field 'stepSize'i d), nt h562r | e a d s (tnitdh(rteiadd)s,) ,n tthirdeIandBsl(onctkh(rtehardesa)d,I dtxi.dxI)n,B lgorcoku(pt(hgrreoaudpI)d,x . x| ) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, g| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)o up(grou p563) | , | ^~~~~~~~~~~s tepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, ar/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ gs->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562a:d15s:) ,warning: initializer order does not match the declaration order [-Wreorder-ctor]t idInBlock(threa d562I | d x . x )t,i dg(rtoiudp)(,g rnotuhpr)e,a d s| ( ^~~~~~~~~~~~~~~~~n thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:a562d:s60):, note: tfield 'group' will be initialized after field 'stepSize'i dInBlo c562k | ( t h r etaiddI(dtxi.dx)),, ngtrhoruepa(dgsr(onutph)r,e a d| s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , | t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)i dInBloc k563( | t h r e asdtIedpxS.ixz)e,( ngcrcoluSph(mgermo.ucpo)m,m . b| u ^~~~~~~~~~~f fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ fSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_F/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hU:N562C:(15A:l lwarning: Rinitializer order does not match the declaration order [-Wreorder-ctor]e duce, COLLNET _562D | I R E C Tt,i dS(ItMiPdL)E,, nStuhmr,e audisn(tn6t4h_rte)a d s| )^, tidI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:B391l:o95c:k (note: texpanded from macro 'IMPL_COLL_FUNC'h readIdx. x391) | , gRruonuWpo(rgkr,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h NCCL_:AL562G:O15_:# #warning: ainitializer order does not match the declaration order [-Wreorder-ctor]l go, NCCL_PROTO_##pro t562o | > ( ) . rtuind((&tnicdc)l,S hnmtehmr.ewaodrsk()n;t h\r e a| d ^s ), ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:I562n:B15l:o cnote: kfield 'nthreads' will be initialized after field 'tidInBlock'( thread I562d | x . x ) ,t igdr(otuipd()g,r onutph)r,e a d| s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( n t| h tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r eads), 563t | i d I n BsltoecpkS(itzher(enacdcIldSxh.mxe)m,. cgormomu.pb(ugfrfoSuipz)e,s [ N| C ^~~~~~~~~~~~~~~~~C L_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hP:R562O:T60O:_ Snote: Ifield 'group' will be initialized after field 'stepSize'M PLE]/N C562C | L _ S T EtPiSd/(stiizde)o,f (nTt)h)r e{a d s| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n t h| r group(groupe ads), tidInBlock(threadId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hx:.641x:)11,: gnote: rin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereo up(group )641, | | ^~~~~~~~~~~ prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd), nt:h562r:e15a:d swarning: (initializer order does not match the declaration order [-Wreorder-ctor]n threads), tidInBlock(t h562r | e a d I dtxi.dx()t,i dg)r,o unpt(hgrreoaudps)(,n t h| r ^~~~~~~~~~~e ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL_ALGO_##:a562l:g15o:, warning: Ninitializer order does not match the declaration order [-Wreorder-ctor]C CL_PROTO_##proto>().run (562& | n c c l Sthimde(mt.iwdo)r,k )n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h;t: h562\r: e15 a:| d ^swarning: (initializer order does not match the declaration order [-Wreorder-ctor]n t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hh:r562e:a15d:s )note: ,field 'nthreads' will be initialized after field 'tidInBlock' t i562d | I 562n | B l ot ci kdt((ittdhi(rdte)ia,dd )In,dt xhn.rtxeh)ar,de sag(drnsot(uhnprt(ehgarrdeosau)dp,s) ),t, i dt| Ii ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~nd BI ln| oB tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)cl ko(ctk h(563rt | eh ar de Ia ddsxIt.dexxp).S,xi )zg,er (ognurcpoc(ulgpSr(hogmurepom)u.,pc )o ,m| m ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ . | b ^~~~~~~~~~~~~~~~~u| f tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h S:i562z:e60s :[563 N | note: C field 'group' will be initialized after field 'stepSize'C L _ Ps Rt562Oe | Tp OS _i Sz IetM(iPndLc(Ect]li/SdNh)Cm,Ce Lmn_.tSchTorEmePmaS.d/bssu(ifnzfteShoirfze(eaTsd)[s)N) C,{C Lt _i| Pd ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~RI On TB| Ol group(group_o ScIkM(PtLhEr]e/aNdC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hIC:dL626x_:.S9xT:)E ,Pnote: Sin instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereg/ rsoiuzp e(626og | fr (o Tu )p )) , { | p| ^~~~~~~~~~~r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ i m s| ( group(groupt id-tidStartScatter,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :n655T:h11r:e anote: din instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heres Scatter ,655 | N U L L , d i r e cptr-i>musp(,t iadr-gtsi-d>SsteanrdtbRuefdfu,c ea,r gnsT-h>rreeacdvsbRuefdfu,c e ,| ^n ullptr, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h&:d202i:r53e:c tnote: -in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here> out, a202r | g s - > s e n d bRuufnfW,o rakrEglse-m>ernetc, 2, 2>::run' requested here> ().ru n202( | w e ) ; | ^ RunWork/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppE:l10e:m1e:n tnote: , 2, 2>::run' requested hereF n, T, 10R | eIdMOPpL,_ CAOlLgLo_,F UPNrCo(tAol>l(R)e.druucne(,w eC)O;L L N| E ^T _DIRECT,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp :S10I:M1P:L Enote: ,in instantiation of member function 'RunWork, 2, 2>::run' requested here Sum, h10a | lIfM)P L _| C^O LL_FUN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:(391A:l95l:R enote: dexpanded from macro 'IMPL_COLL_FUNC'u ce, COLL N391E | T _ DRIuRnEWCoTr,k , N C391C | L _ ARLuGnOW_o#r#kau(n)c.#r#udne(v&rnecdcolpSw,o rNkC)C;L _\A L G| O ^_ ##algo, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hN:C562C:L15_:P Rnote: Ofield 'nthreads' will be initialized after field 'tidInBlock'T O_##pr o562t | o > ( ) .triudn((t&indc)c,l Snhtmherme.awdosr(kn)t;h r\e a d| s ^) , tidI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:B562l:o15c:k (note: tfield 'nthreads' will be initialized after field 'tidInBlock'h readId x562. | x ) , gtriodu(pt(igdr)o,u pn)t,h r e| a ^~~~~~~~~~~~~~~~~d s(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:60e:a dnote: sfield 'group' will be initialized after field 'stepSize') , tidI n562B | l o c k (ttihdr(etaiddI)d,x .nxt)h,r egardosu(pn(tghrroeuapd)s,) , | t ^~~~~~~~~~~~~~~~~i dI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:B562l:o60c:k (note: tfield 'group' will be initialized after field 'stepSize'h readId x562. | x ) , gtriodu(pt(igdr)o,up )n,t h r| e ^~~~~~~~~~~a ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :| 562 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: 15 :| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)warning: initializer order does not match the declaration order [-Wreorder-ctor] 563 | stepSi z562e | ( n c c ltSihdm(etmi.dc)o,m mn.tbhurfefaSdisze(sn[tNhCrCeLa_dPsR)O,T Ot_iSdIIMnPBLlEo]c/kN(CtChLr_eSaTdEIPdSx/.sxi)z,e ogfr(oTu)p)( g{r o u| p ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~) , | group(group| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:c626c:l9S:h mnote: ein instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herem .comm.bu f626f | S i z e s [ N C CpLr_iPmRsO(TtOi_dS-ItMiPdLSEt]a/rNtCSCcLa_tStTeErP,S /nsTihzreeoafd(sTS)c)a t{t e r| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ N U| L group(groupL , direct->up, args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hs:e655n:d11b:u ffnote: ,in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here args->re c655v | b u f f , | ^ prims(ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:-202t:i53d:S tnote: ain instantiation of member function 'RunWorkElement, 2, 2>::run' requested herer tRedu c202e | , n T h r e a dRsuRneWdourckeE,l enmuelnltp,o uAtl,g oa,r gPsr-o>tsoe>n(d)b.urfufn,( waer)g;s - >| r ^e cvbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp :| 10 ^: 1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202: 5310: | Inote: Min instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereP L_COL L202_ | F U N C ( A l l ReRduuncWeo,r kCEOlLeLmNeEnTt_ ( )| .^r un(we);/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391| : ^95 : note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: 391note: | in instantiation of member function 'RunWork, 2, 2>::run' requested here RunW o9r | kII,M PNLCEC,L _SAuLmG,O _u#i#anltg6o4,_ tN)C C L| _^P ROTO_##/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hp:r391o:t95o:> (note: )expanded from macro 'IMPL_COLL_FUNC'. run(&ncc l391S | h m eRmu.nwWoorrkk)<;n c\c l F| u ^n c##func, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:y562p:e15,: Fnote: ufield 'nthreads' will be initialized after field 'tidInBlock'n c##dev r562e | d o p i,d )N,C CnLt_hArLeGaOd_s#(#natlhgroe,a dNsC)C,L _tPiRdOITnOB_l#o#cpkr(otthor>e(a)d.Irduxn.(x&)n,c cglrSohumpe(mg.rwoourpk)),; \| ^~~~~~~~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :note: 562field 'group' will be initialized after field 'stepSize': 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | 562t | i d ( t itd)i,d (nttihdr)e,a dnst(hnrtehardesa(dnst)h,r etaiddsI)n,B ltoicdkI(ntBhlroecakd(Itdhxr.exa)d,I dgxr.oxu)p,( ggrroouupp)(,g r o| u ^~~~~~~~~~~p ), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_AL G562O | _ # # a ltgiod,( tNiCdC)L,_ PnRtOhTrOe_a#d#sp(rnotthor>e(a)d.sr)u,n (t&indcIcnlBSlhomcekm(.twhorreka)d;I d\x . x| ) ^, group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:15: 563note: | field 'nthreads' will be initialized after field 'tidInBlock' stepSize(n c562c | l S h m etmi.dc(otmimd.)b,u fnftShirzeeasd[sN(CnCtLh_rPeRaOdTsO)_,S ItMiPdLIEn]B/lNoCcCkL(_tShTrEePaSd/Isdixz.exo)f,( Tg)r)o u{p ( g| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~o u p| ) group(group, | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 641 :t11i:d (note: tin instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herei d), nthr e641a | d s ( n t h r e a d sp)r,i mtsi(dtIindB-ltoicdkS(ttahrrteRaeddIudcxe.,x )n,T hgrreoaudps(Rgerdouucpe),, d i| r ^~~~~~~~~~~e ct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:h562m:e15m:. cwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]m m.buffSizes[NCCL_ P562R | O T O _ StIiMdP(LtEi]d/)N,C CnLt_hSrTeEaPdSs/(snitzheroefa(dTs))), {t i d| I ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n B l| o group(groupc k(threadIdx.x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h):,626 :g9ro:u pnote: (in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereg roup), 626| | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) pri m563s | ( t i d -sttiedpSStiazret(SnccactltSehrm,e mn.Tchormema.dbsuSfcfaStitzeers,[ NNCUCLLL_,P RdOiTrOe_cStI-M>PuLpE,] /aNrCgCsL-_>SsTeEnPdSb/usfifz,e oafr(gTs)-)> r{e c v| b ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u f f| , group(group | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :641:11: 202note: | in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here R u641n | W o r k E l e m e n tpT(h)r.eraudns(Rweed)u;c e ,| ^d irect->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppd:o11w:n1,: & dnote: iin instantiation of member function 'RunWork, 2, 2>::run' requested herer ect-> o11u | tI,M PaLr_gCsO-L>Ls_eFnUdNbCu(fAfl,l Raerdgusc-e>,r eCcOvLbLuNfEfT,_ D I| R ^E CT, SIMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:L202E:,53 :S unote: min instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, fl o202a | t ) | ^ Run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hW:o391r:k95E:l enote: mexpanded from macro 'IMPL_COLL_FUNC'e nt#(#)f.urnucn,( wtey)p;e , | F ^u nc##devre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppd:o10p:<1t:y pnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested here> , NCC L10_ | AILMGPOL__#C#OaLlLg_oF,U NNCC(CALl_lPRReOdTuOc_e#,# pCrOoLtLoN>E(T)_.DrIuRnE(C&Tn,c cSlISMhPmLeEm,. wSourmk,) ;h a\l f )| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h15::391 :note: 95field 'nthreads' will be initialized after field 'tidInBlock': note: expanded from macro 'IMPL_COLL_FUNC' 562 | 391t | i d (RtuindW)o,r kn,, gNCrCoLu_pA(LgGrOo_u#p#)a,l g o| , ^~~~~~~~~~~~~~~~~ NCC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562P:R60O:T Onote: _field 'group' will be initialized after field 'stepSize'# #proto >562( | ) . r u nt(i&dn(ctcildS)h,m enmt.hwroerakd)s;( n\t h r| e ^a ds), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:d562I:n15B:l onote: cfield 'nthreads' will be initialized after field 'tidInBlock'k (threa d562I | d x . x )t,i dg(rtoiudp)(,g rnotuhpr)e,a d s| ( ^~~~~~~~~~~n threads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hwe:)562;: 15 :| ^warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 9 | ItMiPdL(_tCiOdL)L,_ FnUtNhCr(eAaldlsR(endtuhcree,a dCsO)L,L NtEiTd_IDnIBRlEoCcTk,( tShIrMePaLdEI,d xS.uxm),, ugirnotu6p4(_gtr)o u p| )^, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)391 :95: note: expanded from macro 'IMPL_COLL_FUNC' 563 | st e391p | S i zReu(nnWcocrlkS_,S TNECPCSL/_sAiLzGeOo_f#(#Ta)l)g o{, N| C ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C L _| P group(groupR OTO_##proto>().run(&n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hc:c655l:S11h:m enote: min instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here. work); \ 655 | | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :p15r:i mnote: sfield 'nthreads' will be initialized after field 'tidInBlock'( tid-ti d562S | t a r t Rteiddu(ctei,d )n,T hnrtehardesaRdesd(uncteh,r enaudlsl)p,t rt,i d&IdniBrleocctk-(>tohurte,a daIrdgxs.-x>)s,e ngdrbouufpf(,g raorugps)-,> r e| c ^~~~~~~~~~~~~~~~~v buf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:,562 : 60| : ^ note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h: 202562: | 53 : note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heret id(ti d202) | , n t h r e a dRsu(nnWtohrrkeEaldesm)e,n tto(u)p.(rgurno(uwpe)),; | | ^~~~~~~~~~~ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWorkd,) ,N CnCtLh_rAeLaGdOs_(#n#tahlrgeoa,d sN)C,C Lt_iPdRIOnTBOl_o#c#kp(rtohtroe>a(d)I.drxu.nx()&,n cgcrloSuhpm(egmr.owuopr)k,) ; | \ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | | ^ tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h: 562563: | 15 : note: field 'nthreads' will be initialized after field 'tidInBlock's tepSiz e562( | n c c l Sthimde(mt.icdo)m,m .nbtuhfrfeSaidzse(sn[tNhCrCeLa_dPsR)O,T Ot_iSdIIMnPBLlEo]c/kN(CtChLr_eSaTdEIPdSx/.sxi)z,e ogfr(oTu)p)( g{r o u| p ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~) , | group(group| ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: 562note: | in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here tid( t666i | d ) , n t h r epardism(sn(tthirde,a dnsT)h,r etaiddsIGnaBtlhoecrk,( tdhirreeacdtI-d>xu.px,) ,N UgLrLo,u pa(rggrso-u>ps)e,n d b| u ^~~~~~~~~~~f f, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) , 563 | st enptShirzeea(dnsc(cnltShhrmeeamd.sc)o,m mt.ibduIfnfBSilzoecsk[(NtChCrLe_aPdRIOdTxO._xS)I,M PgLrEo]u/pN(CgCrLo_uSpT)E,P S /| s ^~~~~~~~~~~~~~~~~i zeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677: 11562: | note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here tid(tid )677, | n t h r e a d s ( nptrhirmesa(dtsi)d,- ttiiddSItnaBrltoBccka(stth,r enaTdhIrdexa.dxs)B,c agsrto,u p&(dgirroeucpt)-,> o u| t ^~~~~~~~~~~, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h>:(562):.15r:u nwarning: (initializer order does not match the declaration order [-Wreorder-ctor]& ncclShmem.wor k562) | ; \ t| i ^d (tid),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :n562t:h15r:e anote: dfield 'nthreads' will be initialized after field 'tidInBlock's (nthre a562d | s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xn.txh)r,e agdrso)u,p (tgirdoIunpB)l,o c k| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t h r| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)a dIdx.x )563, | g r o uspt(egprSoiuzpe)(,n c c| l ^~~~~~~~~~~~~~~~~S hme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hm:.562c:o60m:m .note: bfield 'group' will be initialized after field 'stepSize'u ffSize s562[ | N C C L _tPiRdO(TtOi_dS)I,M PnLtEh]r/eNaCdCsL(_nStThErPeSa/dssi)z,e otfi(dTI)n)B l{o c k| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t h r| e group(groupa dIdx.x), gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:u626p:(9g:r onote: uin instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herep ), | ^~~~~~~~~~~ 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:562:15: warning: Cinitializer order does not match the declaration order [-Wreorder-ctor]L _STEPS/sizeof(T)) { 562 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | t group(groupi d(tid), nthreads(nthreads), ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:I677n:B11l:o cnote: kin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here( threadIdx .677x | ) , g r o u p ( g rporuipm)s,( t i| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~- t i| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S tar t563B | c a s t ,s tneTphSriezaed(snBcccalsSth,m e&md.icroemcmt.-b>uofuftS,i zdeisr[eNcCtC-L>_dPoRwOnT,O _aSrIgMsP-L>Es]e/nNdCbCuLf_fS,T EaPrSg/ss-i>zreeocfv(bTu)f)f ,{ | | ^ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 687 : 11 : note: Rin instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereu nWorkEl e687m | e n t < F n , T , pRreidmOsp(,t iAdl-gtoi,d SPtraorttoB>c(a)s.tr,u nn(Twher)e;a d s| B ^c ast, &di/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppr:e9c:t1-:> onote: uin instantiation of member function 'RunWork, 2, 2>::run' requested heret , nul l9p | tIrM,P La_rCgOsL-L>_sFeUnNdCb(uAflfl,R eadrugcse-,> rCeOcLvLbNuEfTf_,D I R| E ^C T, SIMPLE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 202S:u53m:, note: uin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herei nt64_ t202) | | ^ Run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hW:o391r:k95E:l enote: mexpanded from macro 'IMPL_COLL_FUNC'e nt#(#)f.urnucn,( wtey)p;e , | F ^u nc##devr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppe:d10o:p1<:t ynote: pin instantiation of member function 'RunWork, 2, 2>::run' requested heree >, NC C10L | _IAMLPGLO__C#O#LaLl_gFoU,N CN(CAClLl_RPeRdOuTcOe_,# #CpOrLoLtNoE>T(_)D.IrRuEnC(T&,n cScIlMSPhLmEe,m .Swuomr,k )h;a l\f ) | ^| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::391562::9515:: note: note: expanded from macro 'IMPL_COLL_FUNC'field 'nthreads' will be initialized after field 'tidInBlock' 562391 | | R utniWdo(rtkid,x .NxC)C,L _gArLoGuOp_(#g#raolugpo),, N C| C ^~~~~~~~~~~~~~~~~L _PR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hO:T562O:_60#:# pnote: rfield 'group' will be initialized after field 'stepSize'o to>(). r562u | n ( & n ctcildS(htmiedm).,w onrtkh)r;e a\d s (| n ^t hreads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562t:i15d:I nnote: Bfield 'nthreads' will be initialized after field 'tidInBlock'l ock(th r562e | a d I d xt.ixd)(,t igdr)o,u pn(tghrroeuapd)s,( n t| h ^~~~~~~~~~~r eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h().run(:w562e:)15;: warning: | initializer order does not match the declaration order [-Wreorder-ctor] ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 56211 | | I M P Lt_iCdO(LtLi_dF)U,N Cn(tAhlrleRaeddsu(cnet,h rCeOaLdLsN)E,T _tDiIdRIEnCBTl,o cSkI(MtPhLrEe,a dSIudmx,. xf)l,o agtr)o u p| (^g roup)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 391 :| 95 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: note: | expanded from macro 'IMPL_COLL_FUNC' tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563391 | | R usntWeoprSkiP,L EN]C/CNLC_CALL_GSOT_E#P#Sa/lsgioz,e oNfC(CTL)_)P R{O T O| _ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~# # p| r group(groupo to>().run(&ncclShmem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h.:w626o:r9k:) ;note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here\ | ^ 626 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 15 : note: field 'nthreads' will be initialized after field 'tidInBlock'p rims(t i562d | - t i d Sttiadr(ttSicda)t,t enrt,h rneTahdrse(andtshSrceaatdtse)r,, tNiUdLILn,B ldoicrke(ctth-r>euapd,I daxr.gxs)-,> sgernodubpu(fgfr,o uapr)g,s - >| r ^~~~~~~~~~~~~~~~~e cv/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hb:u562f:f60,: note: | field 'group' will be initialized after field 'stepSize' ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202 :t53i:d (note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herei d), n t202h | r e a d s ( n t hRruenaWdosr)k,E lteimdeInntBr(o)u.pr)u,n ( w| e ^~~~~~~~~~~) ; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::1515:: warning: warning: initializer order does not match the declaration order [-Wreorder-ctor]initializer order does not match the declaration order [-Wreorder-ctor] 562 | 562t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atdisd)I,n BtliodcIkn(Btlhorceka(dtIhdrxe.axd)I,d xg.rxo)u,p (ggrroouupp()g,r o u| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)563 | s t563e | p S i z es(tnecpcSliSzhem(enmc.ccloSmhmm.ebmu.fcfoSmimz.ebsu[fNfCSCiLz_ePsR[ONTCOC_LS_IPMRPOLTEO]_/SNICMCPLL_ES]T/ENPCSC/Ls_iSzTeEoPfS(/Ts)i)z e{o f (| T ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~) ) | { group(group | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: 641in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here | 677 | p r i m s ( t i d - tpirdiSmtsa(rttiRde-dtuicdeS,t anrTthBrceaasdts,R endTuhcree,a ddsiBrceacstt-,> d&odwinr,e c&td-i>roeuctt,- >doiurte,c ta-r>gdso-w>ns,e nadrbgusf-f>,s eanrdgbsu-f>fr,e cavrbgusf-f>,r e c| v ^b uff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here: 202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here202 | 202 | R u n W o r kREulneWmoernktE (P)r.ortuon>((w)e.)r;u n (| w ^e ); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp :note: 11in instantiation of member function 'RunWork, 2, 2>::run' requested here: 1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMP L11_ | CIOMLPLL__FCUONLCL(_AFlUlNRCe(dAulcleR,e dCuOcLeL,N ECTO_LDLINREETC_TD,I RSEICMTP,L ES,I MSPuLmE,, hSaulmf,) f l| o^a t) | ^/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :391:95: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hnote: :expanded from macro 'IMPL_COLL_FUNC'391 :95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | Ru n391W | o r kRp,< tNyCpCeL>_,A LNGCOC_L#_#AaLlGgOo_,# #NaClCgLo_,P RNOCTCOL__##protPoR>O(T)O._r#u#np(r&ontcoc>l(S)h.mreumn.(w&onrckc)l;S h\m e m| . ^w ork); \ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :| 562 ^: 15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 15562: | note: field 'nthreads' will be initialized after field 'tidInBlock' tid(t i562d | ) , n tthirde(atdisd()n,t hnrtehardesa)d,s (tnitdhIrneBaldosc)k,( tthirdeIandBIldoxc.kx()t,h rgeraoduIpd(xg.rxo)u,p )g,r o u| p ^~~~~~~~~~~~~~~~~( gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:p562):,60 : | note: ^~~~~~~~~~~~~~~~~field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 60562: | note: field 'group' will be initialized after field 'stepSize' tid(t i562d | ) , n tthirde(atdisd()n,t hnrtehardesa)d,s (tnitdhIrneBaldosc)k,( tthirdeIandBIldoxc.kx()t,h rgeraoduIpd(xg.rxo)u,p )g,r o u| p ^~~~~~~~~~~( group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWorkt,i dN(CtCiLd_)A,L GnOt_h#r#eaaldgso(,n tNhCrCeLa_dPsR)O,T Ot_i#d#IpnrBoltooc>k(()t.hrruena(d&Indcxc.lxS)h,m egmr.owuopr(kg)r;o u\p ) ,| ^ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:15: note: 563field 'nthreads' will be initialized after field 'tidInBlock' | st e562p | S i z e (tnicdc(ltSihdm)e,m .nctohmrme.abdusf(fnStihzreesa[dNsC)C,L _tPiRdOITnOB_lSoIcMkP(LtEh]r/eNaCdCILd_xS.TxE)P,S /gsriozuepo(fg(rTo)u)p ){, | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ | group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60: note: field 'group' will be initialized after field 'stepSize' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 626 :t9i:d (note: tin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herei d), nth r626e | a d s ( n t h r epardism)s,( ttiiddI-ntBildoSctka(rtthSrceaatdtIedrx,. xn)T,h rgeraoduspS(cgartotuepr),, N U| L ^~~~~~~~~~~L , direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(Al/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:R562e:d15u:c ewarning: ,initializer order does not match the declaration order [-Wreorder-ctor] COLLNET_DIRECT, S I562M | P L E , tSiudm(,t ifdl)o,a tn)t h r| e^a ds(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hh:r391e:a95d:s )note: ,expanded from macro 'IMPL_COLL_FUNC' tidInBlo c391k | ( t hRruenaWdoIrdkx<.nxc)c,l Fgurnocu#p#(fgurnocu,p )t,y p e| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ F u| n tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)c ##devr e563d | o p < t ysptee>p,S NiCzCeL(_nAcLcGlOS_h#m#eaml.gcoo,m mN.CbCuLf_fPSRiOzTeOs_[#N#CpCrLo_tPoR>O(T)O._rSuInM(P&LnEc]c/lNSChCmLe_mS.TwEoPrSk/)s;i z\e o f| ( ^T )) { /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~562 : 15| : group(group note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(:t655i:d11):, note: nin instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret hreads( n655t | h r e a d s ) , t ipdrIinmBsl(otcikd(-tthirdeSatdaIrdtxR.exd)u,c eg,r onuTph(rgeraoduspR)e,d u c| e ^~~~~~~~~~~~~~~~~, n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:ll562p:t60r:, note: &field 'group' will be initialized after field 'stepSize'd irect- >562o | u t , atrigds(-t>isde)n,d bnutfhfr,e aadrsg(sn-t>hrreecavdbsu)f,f ,t i d| I ^n Block(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hh:r202e:a53d:I dnote: xin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here. x), g r202o | u p ( g r o u p )R,u n W| o ^~~~~~~~~~~r kElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hout, arg:s562-:>15s:e nwarning: dbinitializer order does not match the declaration order [-Wreorder-ctor]u ff, args->recvbuff, | ^562 | ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:(202t:i53d:) ,note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren threa d202s | ( n t h r e a d s)R,u ntWiodrIknEBlleomcekn(tt ( )| . ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r u n| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)w e); | ^ 563 | st/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppe:p12S:iz1e:( nnote: cin instantiation of member function 'RunWork, 2, 2>::run' requested herec lShme m12. | cIoMmPmL._bCuOfLfLS_iFzUeNsC[(NAClClLR_ePdRuOcTeO,_ SCIOMLPLLNEE]T/_NDCICRLE_CSTT,E PSSI/MsPiLzEe,o fS(uTm),) d{o u b| l ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e ) | group(group| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :R677u:n11W:o rnote: kin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here< ncclFunc #677# | f u n c , t y p e ,p rFiumnsc(#t#idde-vtrieddSotpas,t ,N CnCTLh_rAeLaGdOs_B#c#aasltg,o &,d iNrCeCcLt_-P>RoOuTtO,_ #d#iprreoctto->>(d)o.wrnu,n (a&rngcsc-l>Sshemnedmb.uwfofr,k )ar;g s\- > r| e ^c vbuff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562 :| 15 ^: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :562202 | : 53 : note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herei d(tid )202, | n t h r e a dRsu(nnWtohrrkeEaldesm)e,n tto(u)p.(rgurno(uwpe)),; | | ^~~~~~~~~~~~~~~~~ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp :11note: :field 'group' will be initialized after field 'stepSize'1 : note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 11 | tIiMdP(Lt_iCdO)L,L _nFtUhNrCe(aAdlsl(Rnetdhurceea,d CsO)L,L NtEiTd_IDnIBRlEoCcTk,( tShIrMePaLdEI,d xS.uxm),, fglrooautp)( g r| o^u p), | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h ^~~~~~~~~~~: 391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hexpanded from macro 'IMPL_COLL_FUNC' :562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]391 | RunWorkt,i dNICnCBLl_oAcLkG(Ot_h#r#eaaldgIod,x .NxC)C,L _gPrRoOupT(Og_r#o#uppr)o,t o >| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) . r| u tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n (&ncclS h563m | e m . w osrtke)p;S i\z e (| n ^c clShm/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:m562.:c15o:m mnote: .field 'nthreads' will be initialized after field 'tidInBlock'b uffSiz e562s | [ N C C Lt_iPdR(OtTiOd_)S,I MnPtLhEr]e/aNdCsC(Ln_tShTrEePaSd/ss)i,z etoifd(ITn)B)l o{c k (| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h r e| a group(groupd Idx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h):,626 : 9| : ^~~~~~~~~~~~~~~~~ note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60: note: field 'group' will be initialized after field 'stepSize' 626 | 562 | p rtiimds((ttiidd)-,t indtShtraeratdSsc(antttherre,a dnsT)h,r etaiddsISncBaltotcekr(,t hNrUeLaLd,I ddxi.rxe)c,t -g>ruopu,p (agrrgosu-p>)s,e n d| b ^~~~~~~~~~~u ff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :t15i:d (warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d), nthreads(nthrea d562s | ) , t itdiIdn(Btliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~~~~~~~( thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:a562d:I60d:x .note: xfield 'group' will be initialized after field 'stepSize') , grou p562( | g r o u pt)i,d ( t| i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d ) ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n thread s563( | n t h r esatdesp)S,i ztei(dnIcncBllSohcmke(mt.hcroemamd.Ibduxf.fxS)i,z egsr[oNuCpC(Lg_rPoRuOpT)O,_ S I| M ^~~~~~~~~~~P LE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, dir/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ect->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:t562o:>15(:) .warning: rinitializer order does not match the declaration order [-Wreorder-ctor]u n(&ncclShmem.w o562r | k ) ; \t i d| ( ^t id), n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d snote: (field 'nthreads' will be initialized after field 'tidInBlock'n thread s562) | , t i dtIindB(ltoicdk)(,t hnrtehardeIaddxs.(xn)t,h rgeraodusp)(,g rtoiudpI)n,B l o| c ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~k ( t| h tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r eadIdx .563x | ) , g rsotuepp(Sgirzoeu(pn)c,c l S| h ^~~~~~~~~~~~~~~~~m em./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:o562m:m60.:b unote: ffield 'group' will be initialized after field 'stepSize'f Sizes[ N562C | C L _ P RtOiTdO(_tSiIdM)P,L En]t/hNrCeCaLd_sS(TnEtPhSr/esaidzse)o,f (tTi)d)I n{B l o| c ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~k ( t| h group(groupr eadIdx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:(677g:r11o:u pnote: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here ), | ^~~~~~~~~~~ 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:T)562): 15{: warning: | initializer order does not match the declaration order [-Wreorder-ctor] ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 562 | ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:(677t:i11d:) ,note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heren threads (677n | t h r e a d s ) , tpirdiImnsB(ltoicdk-(ttihdrSetaadrItdBxc.axs)t,, gnrTohurpe(agdrsoBucpa)s,t , | & ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d i r| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)c t->o u563t | , d i rsetcetp-S>idzoew(nn,c calrSghsm-e>ms.ecnodmbmu.fbfu,f faSrigzse-s>[rNeCcCvLb_uPfRfO,T O _| S ^I MPLE]/NCC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hL:_202S:T53E:P Snote: /in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heres izeof (202T | ) ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ R u| n group(groupW orkElement, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereg o, Prot o641> | ( ) . r u n ( w e ) ;p r i| m ^s (tid-tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppS:t12a:r1t:R enote: din instantiation of member function 'RunWork, 2, 2>::run' requested hereu ce, n T12h | rIeMaPdLs_RCeOdLuLc_eF,U NdCi(rAelcltR-e>dduocwen,, C&OdLiLrNeEcTt_-D>IoRuEtC,T ,a rSgIsM-P>LsEe,n dSbuumf,f ,d oaurbglse-)> r e| c^v buff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 391 ^: 95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: 391in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here | Run W202o | r k < n c c l F uRnucn#W#ofruknEcl,e mteynpte<,F nF,u nTc,# #RdeedvOrpe,d oAplr,o tNoC>C(L)_.ArLuGnO(_w#e#)a;l g o| , ^ NCCL_PR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppO:T12O:_1#:# pnote: rin instantiation of member function 'RunWork, 2, 2>::run' requested hereo to>() .12r | uInM(P&Ln_cCcOlLSLh_mFeUmN.Cw(oArlkl)R;e d\u c e| , ^ COLLNET/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:D562I:R15E:C Tnote: ,field 'nthreads' will be initialized after field 'tidInBlock' SIMPLE ,562 | S u m , tdiodu(btlied)) , | n^t hread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:(391n:t95h:r enote: aexpanded from macro 'IMPL_COLL_FUNC'd s), tidI n391B | l o cRku(ntWhorreka, N562C | C L _ A LtGiOd_(#t#iadl)g,o ,n tNhCrCeLa_dPsR(OnTtOh_r#e#apdrso)t,o >t(i)d.IrnuBnl(o&cnkc(ctlhSrhemaedmI.dwxo.rxk)),; g\r o u| p ^( group)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562 :| 15 ^~~~~~~~~~~: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h^ :/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h562::39115::95 :warning: initializer order does not match the declaration order [-Wreorder-ctor]note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWo r562k | < n c c ltFiudn(ct#i#df)u,n cn,t htryepaed,s (Fnutnhcr#e#addesv)r,e dtoipdc,k (NtChCrLe_aAdLIGdOx_.#x#)a,l ggor,o uNpC(CgLr_oPuRpO)T,O _ #| # ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~p r o| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)o >().ru n563( | & n c c lsSthempeSmi.zweo(rnkc)c;l S\h m e| m ^. comm./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hb:u562f:f15S:i znote: efield 'nthreads' will be initialized after field 'tidInBlock's [NCCL_ P562R | O T O _ StIiMdP(LtEi]d/)N,C CnLt_hSrTeEaPdSs/(snitzheroefa(dTs))), {t i d| I ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n B l| o group(groupc k(threadIdx.x), group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(:g687r:o11u:p )note: ,in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :687562 | : 60 : note: field 'group' will be initialized after field 'stepSize' pr i562m | s ( t i dt-itdi(dtSitda)r,t Bnctahsrte,a dnsT(hnrtehardesaBdcsa)s,t ,t i&ddIinrBelcotc-k>(otuhtr,e anduIldlxp.txr),, agrrgosu-p>(sgernodubpu)f,f , | a ^~~~~~~~~~~r gs->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h; : 562| : ^15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | 562I | M P L _ CtOiLdL(_tFiUdN)C,( AnltlhRreedaudcse(,n tChOrLeLaNdEsT)_,D ItRiEdCITn,B lSoIcMkP(LtEh,r eSaudmI,d xr.cxc)l,_ bgfrloouapt(1g6r)o u p| )^, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)391 :95: note: expanded from macro 'IMPL_COLL_FUNC' 563 | st e391p | S i zReu(nnWcocrlkSL,_ SNTCECPLS_/AsLiGzOe_o#f#(aTl)g)o ,{ N C| C ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~L _ P| R group(groupO TO_##proto>().run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(:&641n:c11c:l Snote: hin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herem em.work) ;641 | \ | ^ p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:i562m:s15(:t inote: dfield 'nthreads' will be initialized after field 'tidInBlock'- tidSta r562t | R e d u ctei,d (ntTihdr)e,a dnstRherdeuacdes,( ndtihrreecatd-s>)d,o wtni,d I&ndBilroecckt(-t>horueta,d Iadrxg.sx-)>,s egnrdobuupf(fg,r oaurpg)s,- > r| e ^~~~~~~~~~~~~~~~~c vbu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:f562,: 60 :| ^note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h: 202562: | 53 : note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heret id(ti d202) | , n t h r e a dRsu(nnWtohrrkeEaldesm)e,n tto(u)p.(rgurno(uwpe)),; | | ^~~~~~~~~~~ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:g562o:,15 :N Cwarning: Cinitializer order does not match the declaration order [-Wreorder-ctor]L _PROTO_##proto >562( | ) . r u nt(i&dn(ctcildS)h,m enmt.hwroerakd)s;( n\t h r| e ^a ds), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:I15n:B lnote: ofield 'nthreads' will be initialized after field 'tidInBlock'c k(thre a562d | I d x . xt)i,d (gtriodu)p,( gnrtohurpe)a,d s (| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t h r| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)a ds), t i563d | I n B l osctke(ptShirzeea(dnIcdcxl.Sxh)m,e mg.rcooumpm(.gbruofufpS)i,z e s| [ ^~~~~~~~~~~~~~~~~N C/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:L562_:P60R:O Tnote: Ofield 'group' will be initialized after field 'stepSize'_ SIMPLE ]562/ | N C C L _tSiTdE(PtSi/ds)i,z enotfh(rTe)a)d s{( n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groups ), tidInBloc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hk:(666t:h9r:e anote: din instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereI dx.x), 666g | r o u p ( g r o uppr)i,m s (| t ^~~~~~~~~~~i d, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWork/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hE:l562e:m15e:n twarning: i(d)(.triudn)(,w en)t;h r e| a ^d s(nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cppd:s12):,1 :t inote: din instantiation of member function 'RunWork, 2, 2>::run' requested hereI nBloc k12( | tIhMrPeLa_dCIOdLxL._xF)U,N Cg(rAolulpR(egdruocuep,) , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx941. 67 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for host. 67 warnings generated when compiling for gfx803. 67 warnings generated when compiling for gfx1101. 67 warnings generated when compiling for gfx1102. 67 warnings generated when compiling for gfx1100. 67 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGOIn file included from _#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp#:a1l: gIn file included from o/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 10N: CIn file included from C/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hL:_169P: R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hO:T271O:_19#:# pwarning: runused variable 'ptr' [-Wunused-variable]o to>().run (271& | n c c l S h m e mu.iwnotr6k4)_;t *\ p t| r ^ = recv/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hP:t562r:(150:) +note: lfield 'nthreads' will be initialized after field 'tidInBlock'l 128Off s562e | t ; | t ^~~i d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.b/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.wo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rk); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: 562initializer order does not match the declaration order [-Wreorder-ctor] | tid(tid), nthrea d562s | ( n t h rteiadd(st)i,d )t,i dnItnhBrleoacdks((tnhtrheraedaIddsx).,x )t,i dgIrnoBulpo(cgkr(otuhpr)e,a d I| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~x . x| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), group( g563r | o u p ) ,s t e| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~S i z| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)( ncclShm e563m | . c o m ms.tbeupfSfiSziez(ensc[cNlCSChLm_ePmR.OcToOm_mS.IbMuPfLfES]i/zNeCsC[LN_CSCTLE_PPSR/OsTiOz_eSoIfM(PTL)E)] /{N C C| L ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~_ S T| E group(groupP S/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h655: | 677 : 11 : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here prims( t677i | d - t i d S t a r t Rperdiumcse(,t indT-htriedaSdtsaRretdBuccaes,t ,n unlTlhprtera,d s&Bdciarsetc,t -&>doiurte,c ta-r>gosu-t>,s ednidrbeucftf-,> daorwgns,- >arregcsv-b>usfefn,d b u| f ^f , args->r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:c202v:b53u:f fnote: ,in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here | ^ 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202 :R53u:n Wnote: oin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herer kEleme n202t | < F n , T , RReudnOWpo,r kAEllgeom,e nPtr (T),. rRuend(Owpe,) ;A l g| o ^, Proto>(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp):.4r:u1n:( wnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested here) ; | ^ 4 | IMPL_C/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cppO:L4L:_1F:U Nnote: Cin instantiation of member function 'RunWork, 2, 2>::run' requested here( AllRe d4u | cIeM,P LC_OCLOLLNLE_TF_UDNICR(EAClTl,R eSdIuMcPeL,E ,C OPLrLoNdE,T _iDnItR8E_CtT), S| I^M PLE, P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:o391d:,95 :i nnote: texpanded from macro 'IMPL_COLL_FUNC'8 _t) 391 | | ^ RunWor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hk:<391n:c95c:l Fnote: uexpanded from macro 'IMPL_COLL_FUNC'n c##func, 391t | y p eR,u nFWuonrck#<#ndcecvlrFeudnocp#<#tfyupnec>,, tNyCpCeL,_ AFLuGnOc_####daelvgroe,d oNpCO,T ON_C#C#Lp_rAoLtGoO>_(#)#.arlugno(,& nNcCcClLS_hPmReOmT.Ow_o#r#kp)r;o t\o > (| ) ^. run(&ncc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:S562h:m15e:m .note: wfield 'nthreads' will be initialized after field 'tidInBlock'o rk); \ 562| | ^ tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:)15,: nnote: tfield 'nthreads' will be initialized after field 'tidInBlock'h reads(n t562h | r e a d st)i,d (ttiiddI)n,B lnotchkr(etahdrse(andtIhdrxe.axd)s,) ,g rtoiudpI(ngBrlooucpk)(,t h r| e ^~~~~~~~~~~~~~~~~a dIdx/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h.:x562):,60 :g rnote: ofield 'group' will be initialized after field 'stepSize'u p(grou p562) | , | ^~~~~~~~~~~~~~~~~t id(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:)60,: nnote: tfield 'group' will be initialized after field 'stepSize'h reads( n562t | h r e a dtsi)d,( ttiidd)I,n Bnltohcrke(atdhsr(enatdhIrdexa.dxs)),, gtrioduIpn(Bglroocukp()t,h r e| a ^~~~~~~~~~~d Idx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h | ^~~~~~~~~~~ :562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 15t:i dwarning: (initializer order does not match the declaration order [-Wreorder-ctor]t id), nthreads(nth r562e | a d s ) ,t itdi(dtIindB)l,o cnkt(htrheraedasd(Indtxh.rxe)a,d sg)r,o utpi(dgIrnoBulpo)c,k ( t| h ^~~~~~~~~~~~~~~~~r ead/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:d562x:.60x:) ,note: field 'group' will be initialized after field 'stepSize'g roup( g562r | o u p ) ,t i d| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t i d| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), nth r563e | a d s ( nsttherpeSaidzse)(,n ctcildInBlock(thrSeadIdx.x)h,m egmr.ocuopm(mg.rbouufpf)S,i z e| s ^~~~~~~~~~~[ NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:A562l:l15R:e dwarning: uinitializer order does not match the declaration order [-Wreorder-ctor]c e, COLLNET_DIRECT, 562S | I M P L Et,i dP(rtoidd,) ,u inntth6r4e_atd)s ( n| t^h reads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h):,391 :ti95d:I nnote: Bexpanded from macro 'IMPL_COLL_FUNC'l ock(thre a391d | Id x .Rxu)n,W ogrrkoc,l SNhCmCeLm_.AcLoGmOm_.#b#uaflfgSoi,z eNsC[CNLC_CPLR_OPTROO_T#O#_pSrIoMtPoL>E(])/.NrCuCnL(_&SnTcEcPlSS/hsmiezme.owfo(rTk))); {\ | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h562: | 626 : 9 : tnote: iin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hered (tid), n t626h | r e a d s ( n t hprreiamdss()t,i dt-itdiIdnSBtlaorctkS(ctahtrteeard,I dnxT.hxr)e,a dgsrSocuapt(tgerro,u pN)U,L L ,| ^~~~~~~~~~~~~~~~~d ire/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:t562-:>60u:p ,note: field 'group' will be initialized after field 'stepSize'a rgs->s e562n | d b u f ft,i da(rtgisd-)>,r enctvhbruefafd,s ( n| t ^h reads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :t202i:d53I:n Bnote: lin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereo ck(th r202e | a d I d x . x ) ,R ugnrWoourpk(Eglreomuepn)t,< F n| , ^~~~~~~~~~~ T, RedOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | Ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:h562m:e15m:. cwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]m m.buffSizes[NCC L562_ | P R O T Ot_iSdI(MtPiLdE)],/ NnCtChLr_eSaTdEsP(Sn/tshirzeeaodfs()T,) )t i{d I n| B ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l o c| k group(group( threadIdx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:(666g:r9o:u pnote: )in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | 666 tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) | 563 | p r i m ss(tteipdS,i zneT(hnrcecaldSshGmaetmh.erc,o mdmi.rbeucftf-S>iuzpe,s [NNUCLL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::391562::9515:: note: warning: expanded from macro 'IMPL_COLL_FUNC'initializer order does not match the declaration order [-Wreorder-ctor] 391 | Ru n562W | o r k < ntcicdl(Ftuindc)#,# fnutnhcr,e atdysp(en,t hFruenacd#s#)d,e vtrieddIonpBt,h rNeCaCdLI_dAxL.GxO)_,# #garloguop,( gNrCoCuLp_)P,R O T| O ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~_ # #| p tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r oto>(). r563u | n ( & n csctleSphSmiezme.(wnocrckl)S;h m\e m .| c ^o mm.buff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:i562z:e15s:[ Nnote: Cfield 'nthreads' will be initialized after field 'tidInBlock'C L_PROT O562_ | S I M P LtEi]d/(NtCiCdL)_,S TnEtPhSr/esaidzse(onft(hTr)e)a d{s ) ,| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t i d| I group(groupn Block(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:x687.:x11):, note: gin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer oup(grou p687) | , | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562p:r60i:m snote: (field 'group' will be initialized after field 'stepSize't id-tid S562t | a r t B ctaisdt(,t indT)h,r enatdhsrBecaadsst(,n t&hdrieraedcst)-,> otuitd,I nnBullolcpkt(rt,h raeragdsI-d>xs.exn)d,b ugfrfo,u pa(rggrso-u>pr)e,c v b| u ^~~~~~~~~~~f f, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, up(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h#:a562l:g15o:, warning: Ninitializer order does not match the declaration order [-Wreorder-ctor]C CL_PROTO_##pro t562o | > ( ) . rtuind((&tnicdc)l,S hnmtehmr.ewaodrsk()n;t h\r e a| d ^s ), ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:I562n:B15l:o cnote: kfield 'nthreads' will be initialized after field 'tidInBlock'( threa d562I | d x . x )t,i dg(rtoiudp)(,g rnotuhpr)e,a d s| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n t h| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e ads), t i563d | I n B l osctke(ptShirzeea(dnIcdcxl.Sxh)m,e mg.rcooumpm(.gbruofufpS)i,z e s| [ ^~~~~~~~~~~~~~~~~N CCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:P562R:O60T:O _note: Sfield 'group' will be initialized after field 'stepSize'I MPLE]/ N562C | C L _ S TtEiPdS(/tsiidz)e,o fn(tTh)r)e a{d s (| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t h r| e group(groupa ds), tidInBloc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hk:(666t:h9r:e anote: din instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereI dx.x), g666r | o u p ( g r o u pp)r,i m s| ( ^~~~~~~~~~~t id, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ irect->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, ar/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ gs->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^562 | tid(tid), nthreads(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpph:r8e:a1d:s )note: ,in instantiation of member function 'RunWork, 2, 2>::run' requested here tidInBlo c8k | (ItMhPrLe_aCdOILLd_xF.UxN)C,( AglrloRuepd(ugcreo,u pC),O L L| N ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~E T _| D tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)I RECT, S563I | M P L E ,s tPerpoSdi,z ei(nntc6c4l_Sth)m e m| .^c omm.buf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hf:S391i:z95e:s [note: Nexpanded from macro 'IMPL_COLL_FUNC'C CL_PROTO _391S | I M PRLuEn]W/oNrCkC, NCCL_ALGO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h_:#687#:a11l:g onote: ,in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here NCCL_PRO T687O | _ # # p r o t o > ( )p.rriumns((&tnicdc-ltSihdmSetma.rwtoBrcka)s;t ,\ n T| h ^r eadsBcast,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :&562d:i15r:e cnote: tfield 'nthreads' will be initialized after field 'tidInBlock'- >out, nu l562l | p t r , tairdg(st-i>ds)e,n dnbtuhfrfe,a dasr(gnst-h>rreeacdvsb)u,f ft,i d I| n ^B lock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d202I:d53x:. xnote: )in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, grou p202( | g r o u p ) , R| u ^~~~~~~~~~~~~~~~~n Wo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:k562E:l60e:m enote: nfield 'group' will be initialized after field 'stepSize't e(a)d.sr(unnt(hwree)a;d s )| , ^ tidInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cppo:c8k:(1t:h rnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested herea dIdx. x8) | ,I MgPrLo_uCpO(LgLr_oFuUpN)C,( A l| l ^~~~~~~~~~~R educe, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hE:T562_:D15I:R Ewarning: Cinitializer order does not match the declaration order [-Wreorder-ctor]T , SIMPLE, Prod, 562u | i n t 6 4t_itd)( t i| d^) , nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e391a:d95s:( nnote: texpanded from macro 'IMPL_COLL_FUNC'h reads), 391t | i d IRnuBnlWoocrkk( , N CsCtLe_pASLiGzOe_(#n#cacllgSoh,m eNmC.CcLo_mPmR.ObTuOf_f#S#ipzreost[oN>C(C)L._rPuRnO(T&On_cScIlMSPhLmEe]m/.NwCoCrLk_)S;T E\P S /| s ^i zeof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h): 562{: 15 :| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~note: field 'nthreads' will be initialized after field 'tidInBlock' | group(group 562 | tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:d655):,11 :n tnote: hin instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer eads(nt h655r | e a d s ) , t i d IpnrBilmosc(kt(itdh-rteiaddSItdaxr.txR)e,d ugcreo,u pn(Tghrroeuapd)s,R e d| u ^~~~~~~~~~~~~~~~~c e, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:u562l:l60p:t rnote: ,field 'group' will be initialized after field 'stepSize' &direc t562- | > o u t ,t iadr(gtsi-d>)s,e nndtbhurfefa,d sa(rngtsh-r>eraedcsv)b,u ftfi,d I n| B ^l ock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d202I:d53x:. xnote: )in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, gro u202 | p ( g r o u p )R,u n W| o ^~~~~~~~~~~r kElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##alg/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:,562 :N15C:C Lwarning: _initializer order does not match the declaration order [-Wreorder-ctor]P ROTO_##proto>().run(& n562c | c l S h mteimd.(wtoirdk)),; n\t h r| e ^a ds(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hh:r562e:a15d:s )note: ,field 'nthreads' will be initialized after field 'tidInBlock' tidInB l562o | c k ( t htrieda(dtIiddx).,x )n,t hgrreoaudps((gnrtohurpe)a,d s )| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ t i| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)I nBlock (563t | h r e a dsItdexp.Sxi)z,e (gnrcoculpS(hgmreomu.pc)o,m m .| b ^~~~~~~~~~~~~~~~~u ff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:i562z:e60s:[ Nnote: Cfield 'group' will be initialized after field 'stepSize'C L_PRO T562O | _ S I M PtLiEd](/tNiCdC)L,_ SnTtEhPrSe/asdisz(enotfh(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h562::67715::11 :warning: initializer order does not match the declaration order [-Wreorder-ctor]note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | 562 | tpirdi(mtsi(dt)i,d -nttihdrSetaadrst(Bnctahsrte,a dnsT)h,r etaiddsIBncBalsotc,k (&tdhirreeacdtI-d>xo.uxt),, dgirroeucpt(-g>rdoouwpn),, a r| g ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~s - >| s tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e ndbuff ,563 | a r g s -s>treepcSvibzuef(fn,c c l| S ^h mem.comm/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h.:b202u:f53f:S inote: zin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heree s[NC C202L | _ P R O T O _ S IRMuPnLWEo]r/kNEClCeLm_eSnTtE().run(w/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.he:)626;: 9 :| ^note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp :6269 | : 1 : note: in instantiation of member function 'RunWork, 2, 2>::run' requested here pri m9s | (ItMiPdL-_tCiOdLSLt_aFrUtNSCc(aAtltleRre,d uncTeh,r eCaOdLsLSNcEaTt_tDeIrR,E CNTU,L LS,I MdPiLrEe,c tP-r>oudp,, uairngts6-4>_ste)n d b| u^f f, arg/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:-391>:r95e:c vnote: bexpanded from macro 'IMPL_COLL_FUNC'u ff, | ^ 391 | R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hu:n202W:o53r:k , 2, 2>::run' requested herec clFu n202c | # # f u n c , tRyupneW,o rFkuEnlce#m#ednetvO,p ,N CAClLg_oA,L GPOr_o#t#oa>l(g)o.,r uNnC(CwLe_)P;R O T| O ^_ ##proto>/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp(:)10.:r1u:n (note: &in instantiation of member function 'RunWork, 2, 2>::run' requested heren cclSh m10e | mI.MwPoLr_kC)O;L L\_ F U| N ^C (AllRe/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:u562c:e15,: Cnote: Ofield 'nthreads' will be initialized after field 'tidInBlock'L LNET_ D562I | R E C T ,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCtCL_STEPS/sizeiodf((tTi)d)) ,{ n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groups (nthreads), tidIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hB:l655o:c11k:( tnote: hin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer eadIdx. x655) | , g r o u p ( g r opurpi)m,s ( t| i ^~~~~~~~~~~~~~~~~d -tidStartReduce, nThreadsRed/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:c562e:,60 :n unote: lfield 'group' will be initialized after field 'stepSize'l ptr, &direct-> o562u | t , a rtgisd-(>tsiedn)d,b unftfh,r eaardgss(-n>trhercevabdusf)f,, t i| d ^I nBlock(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:h202r:e53a:d Inote: din instantiation of member function 'RunWorkElement, 2, 2>::run' requested herex .x), g202r | o u p ( g r o u pR)u,n W o| r ^~~~~~~~~~~k Element().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | srtepSize(necccvlbSuhfmfe,m . c| o ^m m.buffSizes[NCCL_PROTO_SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hP:L202E:]53/:N Cnote: Cin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereL _STEPS/siz e202o | f ( T ) ) { R| u ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n W o| r group(groupk Element, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, Proto> (655) | . r u n ( w e ) ; p| r ^i ms(tid-t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cppi:d9S:t1a:r tnote: Rin instantiation of member function 'RunWork, 2, 2>::run' requested heree duce, 9n | TIhMrPeLa_dCsORLeLd_uFcUeN,C (nAullllRpetdru,c e&,d iCrOeLcLtN-E>To_uDtI,R EaCrTg,s -S>IsMePnLdEb,u fPfr,o da,r gusi-n>tr6e4c_vtb)u f f| ,^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h95::202 :note: 53expanded from macro 'IMPL_COLL_FUNC': note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 391202 | | R u n W o r kRe(>),. rNuCnC(Lw_eA)L;G O _| ^# #algo, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cppN:C9C:L1_:P Rnote: Oin instantiation of member function 'RunWork, 2, 2>::run' requested hereT O_##p r9o | tIoM>P(L)_.CrOuLnL(_&FnUcNcCl(SAhlmleRme.dwuocrek,) ;C O\L L N| E ^T _DIRECT, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:I562M:P15L:E ,note: field 'nthreads' will be initialized after field 'tidInBlock'P rod, uin t5626 | 4 _ t ) t i| d^( tid), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:t391h:r95e:a dnote: sexpanded from macro 'IMPL_COLL_FUNC'( nthread s391) | , tRiudnIWnoBrlko:, note: Nfield 'group' will be initialized after field 'stepSize'C CL_ALG O562_ | # # a l gtoi,d (NtCiCdL)_,P RnOtThOr_e#a#dpsr(onttoh>(r).run(&ncecaldSsh)m,e mt.iwdoIrnkB)l;o c\k ( t| h ^r eadIdx.x), group(grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hp:)562,: 15 :| ^~~~~~~~~~~note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ endbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h | : 562 : 15 :t iwarning: dinitializer order does not match the declaration order [-Wreorder-ctor]( tid), nthread s562( | n t h r etaidd(st)i,d )t,i dnItnhBrleoacdks((tnhtrheraedaIddsx).,x )t,i dgIrnoBulpo(cgkr(otuhpr)e,a d I| d ^~~~~~~~~~~~~~~~~x .x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 :g60r:o unote: pfield 'group' will be initialized after field 'stepSize'( group) ,562 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ t| i tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d (tid), 563n | t h r e asdtse(pnStihzree(andcsc)l,S htmiedmI.ncBolmomc.kb(utfhfrSeiazdeIsd[xN.CxC)L,_ PgRrOoTuOp(_gSrIoMuPpL)E,] / N| C ^~~~~~~~~~~C L_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcas/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht,: 562&:d15i:r ewarning: cinitializer order does not match the declaration order [-Wreorder-ctor]t ->out, direct->d o562w | n , a trigds(-t>isde)n,db unftfh,r eaardgss(-n>trhercevabdusf)f,, t i| d ^I nBlock/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:t202h:r53e:a dnote: Iin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hered x.x), 202g | r o u p ( g r o uRpu)n,W o r| k ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~E l e| m tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e nte(m)..croumnm(.wbeu)f;f S i| z ^e s[NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cppP:R11O:T1O:_ Snote: Iin instantiation of member function 'RunWork, 2, 2>::run' requested hereM PLE] /11N | CICMLP_LS_TCEOPLSL/_sFiUzNeCo(fA(lTl)R)e d{u c e| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ C O| L group(groupL NET_DIRECT, SIMPL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hE:,655 :P11r:o dnote: ,in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here float) 655| | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391 : 95 :p rnote: iexpanded from macro 'IMPL_COLL_FUNC'm s(tid-t i391d | S t aRrutnRWeodrukca,r gNsC-C>Ls_eAnLdGbOu_f#f#,a lagrog,s -N>CrCeLc_vPbRuOfTfO,_ # #| p ^r oto>().r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hu:n202(:&53n:c cnote: lin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereS hmem. w202or | k ) ; \ | ^R unWor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hk:E562l:e15m:e nnote: tfield 'nthreads' will be initialized after field 'tidInBlock'< Fn, T, 562R | e d O p ,t iAdl(gtoi,d )P,r onttoh>r(e)a.drsu(nn(twher)e;a d s| ) ^, tidInB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cppl:o10c:k1(:t hnote: rin instantiation of member function 'RunWork, 2, 2>::run' requested heree adIdx .10x | )I,M PgLr_oCuOpL(Lg_rFoUuNpC)(,A l l| R ^~~~~~~~~~~~~~~~~e du/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:e562,: 60C:O Lnote: Lfield 'group' will be initialized after field 'stepSize'N ET_DIR E562C | T , S ItMiPdL(Et,i dP)r, ondt,h rheaaldfs)( n t| h^r eads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 391t:i95d:I nnote: Bexpanded from macro 'IMPL_COLL_FUNC'l ock( t391h | r e aRduIndWxo.rxk)<,n cgcrloFuupn(cg#r#ofuupn)c,, t| y ^~~~~~~~~~~p e, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/:N562C:C15L:_ Swarning: Tinitializer order does not match the declaration order [-Wreorder-ctor]E PS/sizeof(T)) { 562| | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupt id(tid), nthreads(nthreads), tidInBlo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hc:k677(:t11h:r enote: ain instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hered Idx.x), g677r | o u p ( g r o u p ) ,p r i| m ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~s ( t| i tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d -tidSt a563r | t B c a sstt,e pnSTihzree(andcscBlcSahsmte,m .&cdoimrme.cbtu-f>foSuitz,e sd[iNrCeCcLt_-P>RdOoTwOn_,S IaMrPgLsE-]>/sNeCnCdLb_uSfTfE,P Sa/rsgisz-e>orfe(cTv)b)u f{f , | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| ^ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hnote: :in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here666 :9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here202 | 666 | R u n W o r kpErliemmse(ntti>(u)p.,r uNnU(LwLe); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:t562h:r15e:a dwarning: sinitializer order does not match the declaration order [-Wreorder-ctor]) , tidInBlock(thre a562d | I d x . x)t,i dg(rtoiudp)(,g rnotuhpr)e,a d s(| n ^~~~~~~~~~~t hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##pro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ to>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::562641::1511:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | 562 | t i d (ptriidm)s,( tnitdh-rteiaddSst(artReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, fl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oat) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ StartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWorkwarning: ,initializer order does not match the declaration order [-Wreorder-ctor] NCCL_ALGO_##algo, 562N | C C L _ PtRiOdT(Ot_i#d#)p,r onttoh>r(e)a.drsu(nn(t&hnrcecaldSsh)m,e mt.iwdoIrnkB)l;o c\k ( t| h ^r eadId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hx:.562x:)15,: gnote: rfield 'nthreads' will be initialized after field 'tidInBlock'o up(gro u562p | ) , | t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~i d (| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)i d), nt h563r | e a d s (snttehprSeiazdes()n,c ctliSdhImneBml.occokm(mt.hbruefafdSIidzxe.sx[)N,C CgLr_oPuRpO(TgOr_oSuIpM)P,L E ]| / ^~~~~~~~~~~~~~~~~N CCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:S562T:E60P:S /note: sfield 'group' will be initialized after field 'stepSize'i zeof(T )562) | { | t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i d (| t group(groupi d), nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:e687a:d11s:) ,note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret idInBlo c687k | ( t h r e a d I d x .pxr)i,m sgr(otuipd(-gtrioduSpt)a,r t B| c ^~~~~~~~~~~a st, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS//usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :warning: 677initializer order does not match the declaration order [-Wreorder-ctor]: 11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 562677 | | t i d ( t i dp)r,i mnst(htrieda-dtsi(dnthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ StartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:n(we);562 : 15| : ^ warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13562 | | I M P L _tCiOdL(Lt_iFdU)N,C (nAtlhlrReeaddusc(en,t hCrOeLaLdNsE)T,_ DtIiRdEICnTB,l oScIkM(PtLhEr,e aPdrIoddx,. xr)c,c lg_rbofulpo(agtr1o6u)p ) ,| ^ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)391 :95: note: expanded from macro 'IMPL_COLL_FUNC' 563 | s t391e | p S iRzuen(WnocrcklC,L _NSCTCELP_SA/LsGiOz_e#o#fa(lTg)o), {N C C| L ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~_ P R| O group(groupT O_##proto>().run(&ncclS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hh:m655e:m11.:w onote: rin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herek ); \ | ^655 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 15 : pnote: rfield 'nthreads' will be initialized after field 'tidInBlock'i ms(ti d562- | t i d S ttairdt(Rteiddu)c,e ,n tnhTrheraedasd(snRtehdruecaed,s )n,u ltlipdtIrn,B l&odcikr(etchtr-e>aoduItd,x .axr)g,s -g>rsoeunpd(bgurfofu,p )a,r g s| - ^~~~~~~~~~~~~~~~~> rec/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hv:b562u:f60f:, note: field 'group' will be initialized after field 'stepSize'| ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202 :t53i:d (note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herei d), n202t | h r e a d s ( n tRhurneWaodrsk)E,l etmiednItng(r)o.urpu)n,( w e| ) ^~~~~~~~~~~; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. 67 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 67 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :p562r:i15m:s (warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d-tidStartBcas t562, | n T h readsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for host. 67 warnings generated when compiling for gfx908. 67 warnings generated when compiling for gfx90a. 67 warnings generated when compiling for gfx941. 67 warnings generated when compiling for gfx1102. 67 warnings generated when compiling for gfx1100. 67 warnings generated when compiling for gfx803. 67 warnings generated when compiling for gfx1030. 67 warnings generated when compiling for gfx906. 67 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElemen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->In file included from o/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppu:t1,: In file included from d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:r10e: cIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h-:>167d: o/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hw:n562,: 15a:r gwarning: sinitializer order does not match the declaration order [-Wreorder-ctor]- >sendbuff, args- >562r | e c v b utfifd,( t i| d ^) , nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d202s:(53n:t hnote: rin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heree ads), 202t | i d I n B l o c kR(utnhWroerakdEIldexm.exn)t,< Fgnr,o uTp,( gRreoduOpp),, A l| g ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o , | P tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r oto>(). r563u | n ( w e )s;t e p| S ^i ze(nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppS:h4m:e1m:. cnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested herem m.buf f4S | iIzMePsL[_NCCOCLLL__PFRUONTCO(_ASlIlMRPeLdEu]c/eN,C CCLO_LSLTNEEPTS_/DsIiRzEeCoTf,( T)S)I M{P L E| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ M a| x group(group, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h626::3919::95 :note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herenote: expanded from macro 'IMPL_COLL_FUNC' 626 | 391 | R u n WporrikmL,L ,N CdCiLr_eAcLtG-O>_u#p#,a lagrog,s -N>CsCeLn_dPbRuOfTfO,_ #a#rpgrso-t>or>e(c)v.bruufnf(,& n c| c ^l Shmem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h.:w202o:r53k:) ;note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here\ | ^ 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 15 :R unote: nfield 'nthreads' will be initialized after field 'tidInBlock'W orkElem e562n | t < F n ,t iTd,( tRiedd)O,p ,n tAhlrgeoa,d sP(rnotthor>e(a)d.sr)u,n (twied)I;n B l| o ^c k(threa/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppd:I4d:x1.:x )note: ,in instantiation of member function 'RunWork, 2, 2>::run' requested here group (4g | rIoMuPpL)_,C O L| L ^~~~~~~~~~~~~~~~~_ FUN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:(562A:l60l:R enote: dfield 'group' will be initialized after field 'stepSize'u ce, CO L562L | N E T _ DtIiRdE(CtTi,d )S,I MnPtLhEr,e aMdasx(,n tihnrte8a_dts)) , | t^i dInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ho:c391k:(95t:h rnote: eexpanded from macro 'IMPL_COLL_FUNC'a dIdx.x), 391g | r o uRpu(ngWroorukp<)n,c c l| F ^~~~~~~~~~~u nc##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ t().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclFunc##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15:: 562warning: :initializer order does not match the declaration order [-Wreorder-ctor]15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | 562t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atdisd)I,n BtliodcIkn(Btlhorceka(dtIhdrxe.axd)I,d xg.rxo)u,p (ggrroouupp()g,r o u| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | 563s | t e p S isztee(pnSciczleS(hnmcecml.Schommemm..bcuofmfmS.ibzuefsf[SNiCzCeLs_[PNRCOCTLO__PSRIOMTPOL_ES]I/MNPCLCEL]_/SNTCECPLS_/SsTiEzPeSo/fs(iTz)e)o f{( T )| ) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ { | group(group| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::11641:: 11note: :in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | 641 | p r i mpsr(itmisd(-ttiidd-SttiadrSttRaerdtuRceed,u cneT,h rneTahdrseRaeddsuRceed,u cneu,l ldpitrre,c t&-d>idroewcnt,- >&oduitr,e catr-g>so-u>ts,e nadrbgusf-f>,s eanrdgbsu-f>fr,e cavrbgusf-f>,r e c| v ^b uff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here: 202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here202 | 202 | R u n W o r kREulneWmoernktE (P)r.ortuon>((w)e.)r;u n (| w ^e ); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:: 4note: :in instantiation of member function 'RunWork, 2, 2>::run' requested here1 : note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IM P4L | _ICMOPLLL__CFOULNLC_(FAUlNlCR(eAdlulcRee,d uCcOeL,L NCEOTL_LDNIERTE_CDTI,R ESCITM,P LSEI,M PMLaEx,, Muaixn,t 8i_ntt)8 _ t| )^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::95391:: 95note: :expanded from macro 'IMPL_COLL_FUNC' note: expanded from macro 'IMPL_COLL_FUNC' 391 | 391 | R u nRWuonrWkop,e >N,C CNLC_CALL_GAOL_G#O#_a#l#gaol,g oN,C CNLC_CPLR_OPTROO_T#O#_p#r#optroo>t(o)>.(r)u.nr(u&nn(c&cnlcSchlmSehmm.ewmo.rwko)r;k )\; \| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h562::56215::15 :note: field 'nthreads' will be initialized after field 'tidInBlock'note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | 562 | t itdi(dt(itdi)d,) ,n tnhtrheraedasd(sn(tnhtrheraedasd)s,) ,t itdiIdnIBnlBolcokc(kt(htrheraedaIddIxd.xx.)x,) ,g rgoruopu(pg(rgoruopu)p,) , | ^~~~~~~~~~~~~~~~~| ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h562::56260::60 :note: field 'group' will be initialized after field 'stepSize'note: field 'group' will be initialized after field 'stepSize' 562 | 562 | t itdi(dt(itdi)d,) ,n tnhtrheraedasd(sn(tnhtrheraedasd)s,) ,t itdiIdnIBnlBolcokc(kt(htrheraedaIddIxd.xx.)x,) ,g rgoruopu(pg(rgoruopu)p,) , | ^~~~~~~~~~~| ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:o562t:o15>:( )warning: .initializer order does not match the declaration order [-Wreorder-ctor]r un(&ncclShm e562m | . w o r kt)i;d (\t i d| ) ^, nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562s:(15n:t hnote: rfield 'nthreads' will be initialized after field 'tidInBlock' e562a | d s ) , ttiidd(ItniBdl)o,c kn(tthhrreeaaddsI(dnxt.hxr)e,a dgsr)o,u pt(igdrIonuBpl)o,c k (| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d Idx.x) ,563 | g r o u ps(tgerpoSuipz)e,( n c| c ^~~~~~~~~~~~~~~~~l Shm/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:m562.:c60o:m note: mfield 'group' will be initialized after field 'stepSize'. buffSi z562e | s [ N C CtLi_dP(RtOiTdO)_,S InMtPhLrEe]a/dNsC(CnLt_hSrTeEaPdSs/)s,i zteiodfI(nTB)l)o c{k ( t| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h r e| a group(groupd Idx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:(677g:r11o:u pnote: )in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, | ^~~~~~~~~~~ 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562R:u15n:W owarning: rinitializer order does not match the declaration order [-Wreorder-ctor]k Elementn(t)h.rreuand(sw(en)t;h r e| a ^d s), tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppI:n4B:l1o:c knote: (in instantiation of member function 'RunWork, 2, 2>::run' requested heret hread I4d | xI.MxP)L,_ CgOrLoLu_pF(UgNrCou(pA)l,l R e| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u c e| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) COLLNE T563_ | D I R E CsTt,e pSSIiMzPeL(En,c cMlaSxh,m eimn.tc8o_mtm). b u| f^f Sizes/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h[:N391C:C95L:_ Pnote: Rexpanded from macro 'IMPL_COLL_FUNC'O TO_SIMPL E391] | / N CRCuLn_WSoTrEkP11,: Nnote: Cin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC L_ALGO_ #687# | a l g o , N C C L _pPrRiOmTsO(_t#i#dp-rtoitdoS>t(a)r.trBucna(s&tn,c cnlTShhrmeeamd.swBocraks)t;, \& d | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15i:r ewarning: cinitializer order does not match the declaration order [-Wreorder-ctor]t ->out, nullptr ,562 | a r g s -t>isde(ntdibdu)f,f ,n tahrrgesa-d>sr(enctvhbruefafd,s ) ,| ^t idInBlock(threadIdx.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:o202u:p53(:g rnote: oin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereu p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 202| | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) R563u | n W o r ksEtleepmSeinzte<(Fnnc,c lTS,h mReemd.Ocpo,m mA.lbguof,f SPirzoetso[>N(C)C.Lr_uPnR(OwTeO)_;S I M| P ^L E]/NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppS:T5E:P1S:/ snote: iin instantiation of member function 'RunWork, 2, 2>::run' requested herez eof(T )5) | I{M P L| _ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C O L| L group(group_ FUNC(AllReduc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.he:,666 :C9O:L Lnote: Nin instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereE T_DIREC T666, | S I M P L E , pMraixm,s (utiindt,8 _ntT)h r e| a^d sGather,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :d391i:r95e:c tnote: -expanded from macro 'IMPL_COLL_FUNC'> up, NULL ,391 | a r gRsu-n>Wsoernkdurnecc,v btuyfpfe,, F| u ^n c##devr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:d202o:p53<:t ynote: pin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heree >, NC C202L | _ A L G O _ # # aRlugnoW,o rNkCEClLe_mPeRnOtTd(O)p.,r uAnl(g&on,c cPlrSohtmoe>m(.)w.orrukn)(;w e\) ; | ^| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::4562::115:: note: note: in instantiation of member function 'RunWork, 2, 2>::run' requested herefield 'nthreads' will be initialized after field 'tidInBlock' 4 | I M562P | L _ C O LtLi_dF(UtNiCd()A,l lnRtehdruecaed,s (CnOtLhLrNeEaTd_sD)I,R EtCiTd,I nSBIlMoPcLkE(,t hMraexa,d Iidnxt.8x_)t,) g r| o^u p(gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hu:p391):,95 : | note: ^~~~~~~~~~~~~~~~~expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60 :391 | note: field 'group' will be initialized after field 'stepSize' RunWor k562< | n c c l Ftuindc(#t#ifdu)n,c ,n tthyrpeea,d sF(unntch#r#edaedvsr)e,d otpio,c kN(CtChLr_eAaLdGIOd_x#.#xa)l,g og,r oNuCpC(Lg_rPoRuOpT)O,_ # #| p ^~~~~~~~~~~r oto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_CO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &dir/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:c562t:-15>:o uwarning: tinitializer order does not match the declaration order [-Wreorder-ctor], args->sendbuff, args -562> | r e c v btuifdf(,t i d| ) ^, nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:(202n:t53h:r enote: ain instantiation of member function 'RunWorkElement, 2, 2>::run' requested hered s), t i202d | I n B l o c k ( tRhurneWaodrIkdExl.exm)e,n tg (563) | . r u n (swtee)p;S i z| e ^( ncclShme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppm:.5c:o1m:m .note: bin instantiation of member function 'RunWork, 2, 2>::run' requested hereu ffSiz e5s | [INMCPCLL__CPORLOLT_OF_USNICM(PALlEl]R/eNdCuCcLe_,S TCEOPLSL/NsEiTz_eDoIfR(ETC)T), {S I M| P ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~L E ,| group(groupM ax, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::95641:: 11note: :expanded from macro 'IMPL_COLL_FUNC' note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 391 | 641 | R u n W o r k < n c cplrFiumnsc(#t#ifdu-ntci,d Sttyapret,R eFduuncce#,# dneTvhrreedaodpse,, NdCiCrLe_cAtL-G>Od_o#w#na,l g&od,i rNeCcCtL-_>PoRuOtT,O _a#r#gpsr-o>tsoe>n(d)b.urfufn,( &anrcgcsl-S>hrmeecmv.bwuofrfk,) ; | \ ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h202::56253::15 :note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested herenote: field 'nthreads' will be initialized after field 'tidInBlock' 202 | 562 | tRiudn(Wtoirdk)E,l enmtehnrtet(h)r.eraudnI(dwxe.)x;) , | g ^r oup(grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppp:)6,: 1 :| ^~~~~~~~~~~~~~~~~note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 606: | Inote: Mfield 'group' will be initialized after field 'stepSize'P L_COLL _562F | U N C ( AtlildR(etdiudc)e,, nCtOhLrLeNaEdTs_(DnItRhErCeTa,d sS)I,M PtLiEd,I nMBalxo,c ki(ntth3r2e_atd)I d x| .^x ), group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:g391r:o95u:p )note: ,expanded from macro 'IMPL_COLL_FUNC' | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h11::562 :note: 15in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: warning: initializer order does not match the declaration order [-Wreorder-ctor] 655 | prim s562( | t i d - ttiiddS(ttairdt)R,e dnutcher,e andTsh(rnetahdrseRaeddsu)c,e ,t induIlnlBpltorc,k (&tdhirreeacdtI-d>xo.uxt),, agrrgosu-p>(sgernodubpu)f,f , | a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r g s| - tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)> recvbu f563f | , | ^s tepSize(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:c202c:l53S:h mnote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested herem .comm .202b | u f f S i z e s [RNuCnCWLo_rPkREOlTeOm_eSnItM ({) . r| u ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n ( w| e group(group) ; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :655:11: 6note: | in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereI MPL_COL L655_ | F U N C ( A l l R e dpurciem,s (CtOiLdL-NtEiTd_SDtIaRrEtCRTe,d uScIeM,P LnET,h rMeaaxd,s Riendtu3c2e_,t )n u l| l^p tr, &di/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e391c:t95-:> onote: uexpanded from macro 'IMPL_COLL_FUNC't , args-> s391e | n d bRuufnfW,o rakrlrFeucnvcb#u#fffu,n c, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:A562l:l15R:e dwarning: uinitializer order does not match the declaration order [-Wreorder-ctor]c e, COLLNET_DIRECT ,562 | S I M P LtEi,d (Mtaixd,) ,i nntt3h2r_eta)d s (| n^t hread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:)391,: 95t:i dnote: Iexpanded from macro 'IMPL_COLL_FUNC'n Block(th r391e | a d IRduxn.Wxo)r,k (,n cNcClCSLh_mAeLmG.Oc_o#m#ma.lbguof,f SNiCzCeLs_[PNRCOCTLO__P#R#OpTrOo_tSoI>M(P)L.Er]u/nN(C&CnLc_cSlTSEhPmSe/ms.iwzoerokf)(;T )\) {| ^ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h group(group: 562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 666 : 9t:i dnote: (in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret id), n t666h | r e a d s ( n t hprreiamdss()t,i dt,i dnITnhBrleoacdks(Gtahtrheeard,I ddxi.rxe)c,t -g>ruopu,p (NgUrLoLu,p )a,r g s| - ^~~~~~~~~~~~~~~~~> sen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:b562u:f60f:, note: afield 'group' will be initialized after field 'stepSize'r gs->re c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h562v: | b562 u: f15 f: , t warning: i initializer order does not match the declaration order [-Wreorder-ctor]d| ( ^t id), n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht: h202562r: | e53 a: d snote: (in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heretn itdh( rt202ei | ad d) s, ) ,n t thriedaIdnsB(lnotchkr(etahdrse)a,d Itdixd.Ixn)B,l ogcrko(utph(rgeraoduIpd)x,. x )| , ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, C/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ OLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siz/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.heof(T)): 562{: 15 :| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~warning: initializer order does not match the declaration order [-Wreorder-ctor] | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :562641 | : 11 : note: tin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herei d(tid), n641t | h r e a d s ( n threads), tpirdiImnsB(ltoicdk-(ttihdrSetaadrItdRxe.dxu)c,e ,g rnoTuhpr(egardosuRpe)d,u c e| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ d i| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e ct->dow n563, | & d i rsetcetp-S>iozuet(,n cacrlgSsh-m>esme.ncdobmumf.fb,u fafrSgisz-e>sr[eNcCvCbLu_fPfR,O T O| _ ^S IMPLE]/N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:C202L:_53S:T Enote: Pin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereS /size o202f | ( T ) ) { | R ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u n W| o group(groupr kElement, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereo to>().r u666n | ( w e ) ; | ^p rims(ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppd:,7 :n1T:h rnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested herea dsGat h7e | rI,M PdLi_rCeOcLtL-_>FuUpN,C (NAUlLlLR,e daurcges,- >CsOeLnLdNbEuTf_fD,I RaErCgTs,- >SrIeMcPvLbEu,f fM,a x ,| ^u int32_t) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| :^202 :53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: 202note: | expanded from macro 'IMPL_COLL_FUNC' R u391n | W o rRkuEnlWeomrekn#(d)e.vrruend(owpe<)t;y p e| > ^, NCCL_AL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppG:O6_:#1#:a lnote: gin instantiation of member function 'RunWork, 2, 2>::run' requested hereo , NCC L6_ | PIRMOPTLO__C#O#LpLr_oFtUoN>C(()A.lrluRne(d&unccec,l SChOmLeLmN.EwTo_rDkI)R;E C\T , | S ^I MPLE,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :M562a:x15,: inote: nfield 'nthreads' will be initialized after field 'tidInBlock't 32_t) 562| | ^ tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:t391i:d95):, note: nexpanded from macro 'IMPL_COLL_FUNC't hreads(nt h391r | e a dRsu)n,W otrikd/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562N:C60C:L _note: Afield 'group' will be initialized after field 'stepSize'L GO_##a l562g | o , N CtCiLd_(PtRiOdT)O,_ #n#tphrroetaod>s(()n.trhurne(a&dnsc)c,l SthimdeImn.Bwloorckk)(;t h\r e a| d ^I dx.x), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hg:r562o:u15p:( gnote: rfield 'nthreads' will be initialized after field 'tidInBlock'o up), | ^~~~~~~~~~~562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ent().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hRunWor:k562E:l15e:m ewarning: ninitializer order does not match the declaration order [-Wreorder-ctor]t ( ) .triudn((twied));, n| t ^h reads(nthreads), tidInBlock(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpph:r5e:a1d:I dnote: xin instantiation of member function 'RunWork, 2, 2>::run' requested here. x), gro u5p | (IgMrPoLu_pC)O,L L _| F ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~U N C| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)A llRedu c563e | , C O LsLtNeEpTS_iDzIeR(EnCcTc,l SShImMePmL.Ec,o mMma.xb,u fufiSnitz8e_st[)N C C| L^_ PROTO_SI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hM:P391L:E95]:/ Nnote: Cexpanded from macro 'IMPL_COLL_FUNC'C L_STEPS/s i391z | e o fR(uTn)W)o r{k < n| c ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c l F| u group(groupn c##func, type, Func##d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.he:v677r:e11d:o pnote: , FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret ype>, NCC L677_ | A L G O _ # # a l g op,r iNmCsC(Lt_iPdR-OtTiOd_S#t#aprrtoBtcoa>s(t),. rnuTnh(r&enacdcslBSchamsetm,. w&odrikr)e;c t\- > o| u ^t , direct->d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:w562n:,15 :a rnote: gfield 'nthreads' will be initialized after field 'tidInBlock's ->sendb u562f | f , a rtgisd-(>triedc)v,b unftfh,r e a| d ^s (nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:)202,: 53t:i dnote: Iin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren Block (202t | h r e a d I d x .Rxu)n,W ogrrkoEulpe(mgernotu (562) | . r u n (twied)(;t i d| ) ^, nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpps:(7n:t1h:r enote: ain instantiation of member function 'RunWork, 2, 2>::run' requested hered s), t i7d | IInMBPlLo_cCkO(LtLh_rFeUaNdCI(dAxl.lxR)e,d ugcreo,u pC(OgLrLoNuEpT)_,D I R| E ^~~~~~~~~~~C T, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_F/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hUN:C562(:A15l:l Rwarning: einitializer order does not match the declaration order [-Wreorder-ctor]d uce, COLLNET_DIR E562C | T , S ItMiPdL(Et,i dM)a,x ,n tihnrte3a2d_st()n t h| r^e ads), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:i391d:I95n:B lnote: oexpanded from macro 'IMPL_COLL_FUNC'c k(thread I391d | x . xR)u,n Wgorrokul,S hNmCeCmL._cAoLmGmO._b#u#faflSgioz,e sN[CNCCLC_LP_RPORTOOT_O#_#SpIrMoPtLoE>](/)N.CrCuLn_(S&TnEcPcSl/Sshimzeemo.fw(oTr)k)) ;{ \ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| ^ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :562687 | : 11 : note: tin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herei d(tid), 687n | t h r e a d s ( n t hprreiamdss()t,i dt-itdiIdnSBtlaorctkB(ctahsrte,a dnITdhxr.exa)d,s Bgcraosutp,( g&rdoiurpe)c,t - >| o ^~~~~~~~~~~~~~~~~u t,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :n562u:l60l:p tnote: rfield 'group' will be initialized after field 'stepSize', args- >562s | e n d b utfifd,( tairdg)s,- >nrtehcrvebaudfsf(,n t h| r ^e ads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:d202I:n53B:l onote: cin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herek (thre a202d | I d x . x ) , gRroup(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:z562e:o15f:( Twarning: )initializer order does not match the declaration order [-Wreorder-ctor]) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 562 | tid(tid), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:t641h:r11e:a dnote: sin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here( nthreads )641, | t i d I n B l o c kp(rtihmrse(atdiIdd-xt.ixd)S,t agrrtoRuepd(ugcreo,u pn)T,h r e| a ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d s R| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d uce, d i563r | e c t - >sdtoewpnS,i z&ed(inrceccltS-h>moeumt.,c oamrmg.sb-u>fsfeSnidzbeusf[fN,C CaLr_gPsR-O>TrOe_cSvIbMuPfLfE,] / N| C ^C L_STEPS/s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:z202e:o53f:( Tnote: )in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~202 | | group(group RunWorkElem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.he:n626t:<9F:n ,note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereT , RedOp ,626 | A l g o , P r optroi>m(s)(.triudn-(twied)S;t a r| t ^S catter, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppn:T6h:r1e:a dnote: sin instantiation of member function 'RunWork, 2, 2>::run' requested hereS catte r6, | INMUPLLL_,C OdLiLr_eFcUtN-C>(uApl,l Raerdgusc-e>,s eCnOdLbLuNfEfT,_ DaIrRgEsC-T>,r eScIvMbPuLfEf,, M a| x ^, int32/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h_:t202): 53 :| ^note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202391 | : 95 : note: expanded from macro 'IMPL_COLL_FUNC' RunWor k391E | l e mReunntWF(u)n.cr#u#nd(ewver)e;d o p| < ^t ype>, N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppC:C6L:_1A:L Gnote: Oin instantiation of member function 'RunWork, 2, 2>::run' requested here_ ##alg o6, | INMCPCLL__CPORLOLT_OF_U#N#Cp(rAoltloR>e(d)u.creu,n (C&OnLcLcNlESTh_mDeImR.EwCoTr,k )S;I M\P L E| , ^ Max, in/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:35622:_15t:) note: field 'nthreads' will be initialized after field 'tidInBlock'| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h562: | 391 : 95 : tnote: iexpanded from macro 'IMPL_COLL_FUNC'd (tid), n t391h | r e aRdusn(Wnotrhkru,p (NgCrCoLu_pA)L,G O _| # ^~~~~~~~~~~~~~~~~# algo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562N:C60C:L _note: Pfield 'group' will be initialized after field 'stepSize'R OTO_## p562r | o t o > (t)i.dr(utni(d&)n,c cnltShhrmeeamd.sw(onrtkh)r;e a\d s )| , ^ tidIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hB:l562o:c15k:( tnote: hfield 'nthreads' will be initialized after field 'tidInBlock'r eadIdx .562x | ) , g rtoiudp((tgirdo)u,p )n,t h r| e ^~~~~~~~~~~a ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().ru n562( | w e ) ; t i| d ^( tid), nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpph:r7e:a1d:s (note: nin instantiation of member function 'RunWork, 2, 2>::run' requested heret hread s7) | ,I MtPiLd_ICnOBLlLo_cFkU(NtCh(rAelaldRIeddxu.cxe),, CgOrLoLuNpE(Tg_rDoIuRpE)C,T , | S ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~I M P| L tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)E , Max, u563i | n t 3 2 _stt)e p S| i^z e(ncclS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hh:m391e:m95.:c onote: mexpanded from macro 'IMPL_COLL_FUNC'm .buffSiz e391s | [ N CRCuLn_WPoRrOkT, NCCL_ALGO_##/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ha:l655g:o11,: Nnote: Cin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC L_PROTO_ #655# | p r o t o > ( ) . r upnr(i&mnsc(ctliSdh-mteimd.Swtoarrkt)R;e d\u c e| , ^ nThread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:R562e:d15u:c enote: ,field 'nthreads' will be initialized after field 'tidInBlock' nullpt r562, | & d i rteicdt(-t>iodu)t,, natrhgrse-a>dsse(nndtbhurfefa,d sa)r,g st-i>drIencBvlboucfkf(,t h r| e ^a dIdx.x), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hg:r202o:u53p:( gnote: rin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereo up), 202| | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 60R:u nnote: Wfield 'group' will be initialized after field 'stepSize'o rkElem e562n | t < F n ,t iTd,( tRiedd)O,p ,n tAhlrgeoa,d sP(rnotthor>e(a)d.sr)u,n (twied)I;n B l| o ^c k(thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppI:d6x:.1x:) ,note: in instantiation of member function 'RunWork, 2, 2>::run' requested hereg roup( g6r | oIuMpP)L,_ C O| L ^~~~~~~~~~~L _FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562 :15562: | warning: initializer order does not match the declaration order [-Wreorder-ctor] tid(tid), nt h562r | e a d s (tnitdh(rteiadd)s,) ,n tthirdeIandBsl(onctkh(rtehardesa)d,I dtxi.dxI)n,B lgorcoku(pt(hgrreoaudpI)d,x . x| ) ^~~~~~~~~~~, group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hg:r562o:u15p:( gwarning: rinitializer order does not match the declaration order [-Wreorder-ctor]o up), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60 :562 | note: field 'group' will be initialized after field 'stepSize' tid( t562i | d ) , nttihdr(etaidds)(,n tnhtrheraedasd)s,( nttihdrIenaBdlso)c,k (ttihdrIenaBdlIodcxk.(xt)h,r egardoIudpx(.gxr)o,u pg)r,o u p| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~g r o| u tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)p ), | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBca/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ st, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :202562 | : 15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] RunWorkElement< F562n | , T , tRiedd(Otpi,d )A,l gnot,h rPeraodtso(>n(t)h.rreuand(sw)e,) ;t i d| I ^n Block(th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppr:e7a:d1I:d xnote: .in instantiation of member function 'RunWork, 2, 2>::run' requested herex ), gr o7u | pI(MgPrLo_uCpO)L,L _ F| U ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~N C (| A tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)l lReduc e563, | C O L LsNtEeTp_SDiIzReE(CnTc,c lSSIhMmPeLmE.,c oMmamx.,b uufifnSti3z2e_s[tN)C C L| _^P ROTO_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hI:M391P:L95E:] /note: Nexpanded from macro 'IMPL_COLL_FUNC'C CL_STEPS /391s | i z eRoufn(WTo)r)k <{n c c| l ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~F u n| c group(group# #func, type, Fu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:c626#:#9d:e vnote: rin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heree dop | , N C C L _ A LpGrOi_m#s#(atligdo-,t iNdCSCtLa_rPtRSOcTaOt_t#e#rp,r ontToh>r(e)a.drsuSnc(a&tntcecrl,S hNmUeLmL.,w odrikr)e;c t\- > u| p ^, args->sen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:b562u:f15f:, note: afield 'nthreads' will be initialized after field 'tidInBlock'r gs->recv b562u | f f , t| i ^d (tid), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:t202h:r53e:a dnote: sin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here( nthre a202d | s ) , t i d I nRBulnoWcokr(ktEhlreemaednItd/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:)562.:r60u:n (note: wfield 'group' will be initialized after field 'stepSize'e ); | ^ 562 | t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppi:d9(:t1i:d )note: ,in instantiation of member function 'RunWork, 2, 2>::run' requested here nthre a9d | sI(MnPtLh_rCeOaLdLs_)F,U NtCi(dAIlnlBRleodcukc(et,h rCeOaLdLINdExT._xD)I,R EgCrTo,u pS(IgMrPoLuEp,) ,M a x| , ^~~~~~~~~~~ uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:n562B:l15o:c kwarning: (initializer order does not match the declaration order [-Wreorder-ctor]t hreadIdx.x), gr o562u | p ( g r otuipd)(,t i d| ) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, n| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)h reads( n563t | h r e a dsst)e,p StiizdeI(nnBclcolcSkh(mtehmr.ecaodmImd.xb.uxf)f,S igzreosu[pN(CgCrLo_uPpR)O,T O _| S ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~I M P| L tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)E ]/NCCL _563S | T E P S /sstiezpeSoifz(eT()n)c c{l S h| m ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e m .| c group(groupo mm.buffSizes[NC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hC:L655_:P11R:O Tnote: Oin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here_ SIMPLE] /655N | C C L _ S T E P S / spirziemosf((tTi)d)- t{i d S| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a r t| R group(groupe duce, nThread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hs:R666e:d9u:c enote: ,in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here nullpt r666, | & d i r e c t -p>roiumts,( tairdg, sn-T>hsreenaddbsuGfaft,h earr,g sd-i>rreecctv-b>uufpf,, N U| L ^L , args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:s202e:n53d:b unote: fin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heref , arg s202- | > r e c v b u f fR,u n W| o ^r kEleme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:t202<:F53n:, note: Tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, RedO p202, | A l g o , PRruontWoo>r(k)E.lreumne(nwte<)F;n , | T ^, RedOp,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp :A8l:g1o:, note: Pin instantiation of member function 'RunWork, 2, 2>::run' requested herer oto>( )8. | rIuMnP(Lw_eC)O;L L _| F ^U NC(AllR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppe:d8u:c1e:, note: Cin instantiation of member function 'RunWork, 2, 2>::run' requested hereO LLNET _8D | IIRMEPCLT_,C OSLILM_PFLUEN,C (MAalxl,R eidnutc6e4,_ tC)O L L| N^E T_DIR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hE:C391T:,95 :S Inote: Mexpanded from macro 'IMPL_COLL_FUNC'P LE, Max, 391i | n t 6R4u_ntW)o r k| <^n cclFu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hn:c391#:#95f:u nnote: cexpanded from macro 'IMPL_COLL_FUNC', type, F u391n | c # #RdeuvnrWeodrokp<u,n cN#C#CfLu_nAcL,G Ot_y#p#ea,l gFou,n cN#C#CdLe_vPrReOdToOp_<#t#yppreo>t,o >N(C)C.L_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCrL_PROToOu_p#(#gprrooutpo)>,( ) .| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u n (| & tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n cclShmem.work); \ 563| | ^ st/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:p562S:i15z:e (note: nfield 'nthreads' will be initialized after field 'tidInBlock'c clShme m562. | c o m m .tbiudf(ftSiidz)e,s [nNtChCrLe_aPdRsO(TnOt_hSrIeMaPdLsE)],/ NtCiCdLI_nSBTlEoPcSk/(stihzreeoafd(ITd)x). x{) , | g ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r o u| p group(group( group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:i677d:(11t:i dnote: )in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, nthreads( n677t | h r e a d s ) , t ipdrIinmBsl(otcikd(-tthirdeSatdaIrdtxB.cxa)s,t ,g rnoTuhpr(egardosuBpc)a,s t ,| ^~~~~~~~~~~& direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) {/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we )562; | | ^ tid(tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp):,8 :n1t:h rnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested herea ds(nt h8r | eIaMdPsL)_,C OtLiLd_IFnUBNlCo(cAkl(ltRherdeuacdeI,d xC.OxL)L,N EgTr_oDuIpR(EgCrTo,u pS)I,M P L| E ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, M| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)x , int6 4563_ | t ) | s^t epSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:n391c:c95l:S hnote: mexpanded from macro 'IMPL_COLL_FUNC'e m.comm.b u391f | f S iRzuensW[oNrCkC ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, N| C group(groupC L_ALGO_##alg/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:,677 :N11C:C Lnote: _in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereP ROTO_##p r677o | t o > ( ) . r u n ( &pnrcicmlsS(htmiedm-.twiodrSkt)a;r t\B c a| s ^t , nThr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:a562d:s15B:c anote: sfield 'nthreads' will be initialized after field 'tidInBlock't , &dir e562c | t - > o utti,d (dtiirde)c,t -n>tdhorwena,d sa(rngtsh-r>esaednsd)b,u ftfi,d IanrBglso-c>kr(etchvrbeuafdfI,d x .| x ^) , grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hp:(202g:r53o:u pnote: )in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, | ^~~~~~~~~~~~~~~~~ 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 60 : note: field 'group' will be initialized after field 'stepSize'R unWork E562l | e m e n tt)(,) .triudnI(nwBel)o;c k (| t ^h readIdx/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp.:x8):,1 :g rnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested hereu p(gro u8p | )I,M P L| _ ^~~~~~~~~~~C OLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h), nthr:e562a:d15s:( nwarning: tinitializer order does not match the declaration order [-Wreorder-ctor]h reads), tidInBlock (562t | h r e a dtIiddx(.txi)d,) ,g rnotuhpr(egardosu(pn)t,h r e| a ^~~~~~~~~~~~~~~~~d s),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :t562i:d60I:n Bnote: lfield 'group' will be initialized after field 'stepSize'o ck(th r562e | a d I d xt.ixd)(,t igdr)o,u pn(tghrroeuapd)s,( n t| h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~r e a| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)s ), tid I563n | B l o c ks(ttehprSeiazdeI(dnxc.cxl)S,h mgermo.ucpo(mgmr.obuupf)f,S i z| e ^~~~~~~~~~~s [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::1515:: warning: warning: initializer order does not match the declaration order [-Wreorder-ctor]initializer order does not match the declaration order [-Wreorder-ctor] 562 | 562 | t itdi(dt(itdi)d,) ,n tnhtrheraedasd(sn(tnhtrheraedasd)s,) ,t itdiIdnIBnlBolcokc(kt(htrheraedaIddIxd.xx.)x,) ,g rgoruopu(pg(rgoruopu)p,) , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | 563 | s tsetpeSpiSziez(en(cncclcSlhSmhemme.mc.ocmomm.mb.ubfuffSfiSziezse[sN[CNCCLC_LP_RPORTOOT_OS_ISMIPMLPEL]E/]N/CNCCLC_LS_TSETPESP/Ss/isziezoefo(fT()T)) ){ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group| group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h677::64111::11 :note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herenote: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | 641 | p rpirmism(st(itdi-dt-itdiSdSttaarrttBRceadsutc,e ,n TnhTrheraedasdBscRaesdtu,c e&,d idriercetc-t>-o>udto,w nd,i r&edcitr-e>cdto-w>no,u ta,r gasr-g>ss-e>nsdebnudfbfu,f fa,r gasr-g>sr-e>crvebcuvfbfu,f f ,| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h53::202 :note: 53in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | 202 | R u nRWuonrWkoErlkeEmleenmtet(o)>.(r)u.nr(uwne()w;e ) ;| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp1::8 :note: 1in instantiation of member function 'RunWork, 2, 2>::run' requested here: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | I M8P | LI_MCPOLL_LC_OFLULN_CF(UANlCl(RAeldluRceed,u cCeO,L LCNOELTL_NDEITR_EDCITR,E CSTI,M PSLIEM,P LMEa,x ,M aixn,t 6i4n_tt6)4 _ t| )^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h95::391 :note: 95expanded from macro 'IMPL_COLL_FUNC': note: expanded from macro 'IMPL_COLL_FUNC' 391 | 391R | u n WRournkW, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ype>, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:t562h:r15e:a dwarning: Iinitializer order does not match the declaration order [-Wreorder-ctor]d x.x), group(grou p562) | , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t i d| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t id), n t563h | r e a d ss(tnetphSriezaed(sn)c,c ltSihdmIenmB.lcoocmkm(.tbhurfefaSdiIzdexs.[xN)C,C Lg_rPoRuOpT(Og_rSoIuMpP)L,E ] /| N ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C C L| _ tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S TEPS/s i563z | e o f ( Ts)t)e p{S i z| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( n c| c group(groupl Shmem.comm.buffSizes[NCCL_PROTO_SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hP:L626E:]9/:N Cnote: Cin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereL _STEPS/ s626i | z e o f ( T ) ) p{r i m| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( t i| d group(group- tidStartScatte/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hr:,626 :n9T:h rnote: ein instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herea dsScatt e626r | , N U L L , dpirriemcst(-t>iudp-,t iadrSgtsa-r>tsSecnadtbtuefrf,, naTrhgrse-a>drseSccvabtutfefr,, N| U ^L L, direct-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:u202p:,53 :a rnote: gin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heres ->sen d202b | u f f , a r g sR-u>nrWeocrvkbEulfefm,e n t| < ^F n, T, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hR:e202d:O53p:, note: Ain instantiation of member function 'RunWorkElement, 2, 2>::run' requested herel go, P202r | o t o > ( ) . r uRnu(nwWeo)r;k E l| e ^m ent, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :S562I:M15P:L Ewarning: ,initializer order does not match the declaration order [-Wreorder-ctor] Max, float) | ^ 562 | tid(tid)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 391n:t95h:r enote: aexpanded from macro 'IMPL_COLL_FUNC'd s(nthreads), 391t | i d IRnuBnlWoocrkk(563, | N C C Ls_tAeLpGSOi_z#e#(anlcgcol,S hNmCeCmL._cPoRmOmT.Ob_u#f#fpSriozteos>[(N)C.CrLu_nP(R&OnTcOc_lSSIhMmPeLmE.]w/oNrCkC)L;_ S\T E P| S ^/ sizeof(T)) { | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: 562 :| 15 group(group: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 641 : 11t:i dnote: (in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heret id), nt h641r | e a d s ( n t h r e apdrsi)m,s (ttiiddI-ntBildoSctka(rtthRreedaudcIed,x .nxT)h,r egardosuRpe(dgurcoeu,p )d,i r e| c ^~~~~~~~~~~~~~~~~t ->d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:w562n:,60 :& dnote: ifield 'group' will be initialized after field 'stepSize'r ect->o u562t | , a r gtsi-d>(steindd)b,u fnft,h raeragdss-(>nrtehcrvebaudfsf),, t| i ^d InBlock/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:t202h:r53e:a dnote: Iin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hered x.x), 202g | r o u p ( g r o uRpu)n,W o r| k ^~~~~~~~~~~E lement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here562 :15: warning: 202initializer order does not match the declaration order [-Wreorder-ctor] | RunWorkElemen t562< | F n , Tt,i dR(etdiOdp),, Anltghor,e aPdrso(tnot>h(r)e.ardusn)(,w et)i;d I n| B ^l ock(thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppe:a10d:I1d:x .note: xin instantiation of member function 'RunWork, 2, 2>::run' requested here) , gro u10p | (IgMrPoLu_pC)O,L L _| F ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~U N C| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)A llRedu c563e | , C O LsLtNeEpTS_iDzIeR(EnCcTc,l SShImMePmL.Ec,o mMma.xb,u fhfaSlifz)e s [| N^C CL_PRO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hT:O391_:S95I:M Pnote: Lexpanded from macro 'IMPL_COLL_FUNC'E ]/NCCL_S T391E | P S /RsuinzWeoorfk(9,: Nnote: Cin instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC L_ALGO _666# | # a l g o , N CpCrLi_mPsR(OtTiOd_,# #npTrhorteoa>d(s)G.artuhne(r&,n cdcilrSehcmte-m>.uwpo,r kN)U;L L\, a| r ^g s->sendb/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:f562f:,15 :a rnote: gfield 'nthreads' will be initialized after field 'tidInBlock's ->recv b562u | f f , t| i ^d (tid), n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:h202r:e53a:d snote: (in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren threa d202s | ) , t i d I n BRluoncWko(rtkhErleeamdeIndtx<.Fxn),, Tg,r oRuepd(Ogpr,o uApl)g,o , | P ^~~~~~~~~~~~~~~~~r oto/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h>:(562):.60r:u nnote: (field 'group' will be initialized after field 'stepSize'w e); | ^ 562 | ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppd:(11t:i1d:) ,note: in instantiation of member function 'RunWork, 2, 2>::run' requested heren threa d11s | (InMtPhLr_eCaOdLsL)_,F UtNiCd(IAnlBllRoecdku(cteh,r eCaOdLILdNxE.Tx_)D,I RgErCoTu,p (SgIrMoPuLpE),, M a| x ^~~~~~~~~~~, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWorki,d )N,C CnLt_hArLeGaOd_s#(#natlhgroe,a dNsC)C,L _tPiRdOITnOB_l#o#cpkr(otthor>e(a)d.Irduxn.(x&)n,c cglrSohumpe(mg.rwoourpk)),; \| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | ^| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h: 562563: | 15 : note: field 'nthreads' will be initialized after field 'tidInBlock's tepSize (562n | c c l S htmiedm(.tciodm)m,. bnutfhfrSeiazdess([nNtChCrLe_aPdRsO)T,O _tSiIdMIPnLBEl]o/cNkC(CtLh_rSeTaEdPISd/xs.ixz)e,o fg(rTo)u)p ({g r o| u ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~p ) ,| group(group | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11 :562 | note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here tid(t i655d | ) , n t h r e a d sp(rnitmhsr(etaidds-)t,i dtSitdaIrntBRleodcukc(et,h rneTahdrIedaxd.sxR)e,d ugcreo,u pn(uglrloputpr),, & d| i ^~~~~~~~~~~r ect->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hR:u562n:W15o:r kwarning: (,n tNhCrCeLa_dAsL)G,O _t#i#daIlngBol,o cNkC(CtLh_rPeRaOdTIOd_x#.#xp)r,o tgor>o(u)p.(rgurno(u&pn)c,c l S| h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~m e m| . tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)w ork); \563 | | ^ stepSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:n562c:c15l:S hnote: mfield 'nthreads' will be initialized after field 'tidInBlock'e m.com m562. | b u f f Stiizde(st[iNdC)C,L _nPtRhOrTeOa_dSsI(MnPtLhEr]e/aNdCsC)L,_ StTiEdPISn/Bsliozceko(ft(hTr)e)a d{I d x| . ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~x ) ,| group(groupg roup(group), | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h ^~~~~~~~~~~~~~~~~: 687:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h11::562 :note: 60in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: note: field 'group' will be initialized after field 'stepSize' 687 | 562 | t i d ( tpirdi)m,s (nttihdr-etaiddsS(tnatrhtrBecaadsst),, ntTihdrIenaBdlsoBccka(stth,r e&addiIrdexc.tx-)>,o ugtr,o unpu(lglrpoturp,) ,a r g| s ^~~~~~~~~~~- >sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, flo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ at) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ CCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h 391: | 562 : 15R:u nwarning: Winitializer order does not match the declaration order [-Wreorder-ctor]o rkh,r eNaCdCsL)_,A LtGiOd_I#n#Ballogcok,( tNhCrCeLa_dPIRdOxT.Ox_)#,# pgrrootuop>((g)r.oruupn)(,& n c| c ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~l S h| m tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e m.work )563; | \ | s ^t epSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:n562c:c15l:S hnote: mfield 'nthreads' will be initialized after field 'tidInBlock'e m.comm .562b | u f f S itzieds([tNiCdC)L,_ PnRtOhTrOe_aSdIsM(PnLtEh]r/eNaCdCsL)_,S TtEiPdSI/nsBilzoecokf((tTh)r)e a{d I d| x ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~. x )| , group(group group(group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h| : ^~~~~~~~~~~~~~~~~677 :11:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :note: 562in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: 60: note: field 'group' will be initialized after field 'stepSize' 677 | 562 | t i dp(rtiimds)(,t indt-htriedaSdtsa(rnttBhcraesatd,s )n,T htriedaIdnsBBlcoacskt(,t h&rdeiardeIcdtx-.>xo)u,t ,g rdoiurpe(cgtr-o>udpo)w,n , | a ^~~~~~~~~~~r gs->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: 562 :| 15 group(group: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 562 | 655t | i d ( t i d ) , n tphrriemasd(st(indt-htriedaSdtsa)r,t RteidduIcneB,l oncTkh(rtehardesaRdeIdduxc.ex,) ,n uglrloputpr(,g r&oduipr)e,c t -| > ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u t| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) args-> s563e | n d b u fsft,e paSrigzse-(>nrcecclvSbhumfefm,. c o| m ^m .buffSi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hz:e202s:[53N:C Cnote: Lin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here_ PROTO _202S | I M P L E ] / N CRCuLn_WSoTrEkPESl/esmiezneto().run(we);/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 677| : ^11 : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: 677in instantiation of member function 'RunWork, 2, 2>::run' requested here | 13 | I M PpLr_iCmOsL(Lt_iFdU-NtCi(dASltlaRretdBuccaes,t ,C OnLTLhNrEeTa_dDsIBRcEaCsTt,, S&IdMiPrLeEc,t -M>aoxu,t ,r cdcilr_ebcftl-o>adto1w6n), a| r^g s->s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:n391d:b95u:f fnote: ,expanded from macro 'IMPL_COLL_FUNC' args->r e391c | v b uRfufn,W o r| k ^< ncclFunc#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h#:f202u:n53c:, note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herey pe, F u202n | c # # d e v r e dRoupnl,e mNeCnCtL<_FAnL,G OT_,# #RaeldgOop,, NAClCgLo_,P RPOrToOt_o#>#(p)r.ortuon>((w)e.)r;u n (| & ^n cclShm/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cppe:m13.:w1o:r knote: )in instantiation of member function 'RunWork, 2, 2>::run' requested here; \ | ^13 | IMPL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:C562O:L15L:_ Fnote: Ufield 'nthreads' will be initialized after field 'tidInBlock'N C(AllR e562d | u c e , tCiOdL(LtNiEdT)_,D InRtEhCrTe,a dSsI(MnPtLhEr,e aMdasx),, rtcicdlI_nbBflloocakt(1t6h)r e a| d^I dx.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :g391r:o95u:p (note: gexpanded from macro 'IMPL_COLL_FUNC'r oup), | ^~~~~~~~~~~~~~~~~391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hR:u562n:W60o:r knote: ), N| C^C L_ALGO_##algo, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hN:C391C:L95_:P Rnote: Oexpanded from macro 'IMPL_COLL_FUNC'T O_##proto>( )391. | r u nR(u&nnWcocrlkS | , N C CtLi_dA(LtGiOd_)#,# anltghor,e aNdCsC(Ln_tPhRrOeTaOd_s#)#,p rtoitdoI>n(B)l.orcukn((t&hnrcecaldSIhdmxe.mx.)w,o rgkr)o;u p\( g r| o ^u p), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h562::56260::15 :note: field 'group' will be initialized after field 'stepSize'note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | 562 | t i d (ttiidd()t,i dn)t,h rnetahdrse(andtsh(rnetahdrse)a,d st)i,d ItniBdlIoncBkl(otchkr(etahdrIedaxd.Ixd)x,. xg)r,o ugpr(ogurpo(ugpr)o,u p )| , ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::562391::1595:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]expanded from macro 'IMPL_COLL_FUNC' 391 | R562u | n W o r kt, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :391562 | : 15 :R uwarning: ninitializer order does not match the declaration order [-Wreorder-ctor]W orka,d sN)C,C Lt_iAdLIGnOB_l#o#cakl(gtoh,r eNaCdCILd_xP.RxO)T,O _g#r#opurpo(tgor>o(u)p.)r,u n (| & ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n c c| l tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S hmem.w o563r | k ) ; \s t e| p ^S ize(ncclS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hh:m562e:m15.:c onote: mfield 'nthreads' will be initialized after field 'tidInBlock'm .buffSiz e562s | [ N C C Lt_iPdR(OtTiOd_)S,I MnPtLhEr]e/aNdCsC(Ln_tShTrEePaSd/ss)i,z etoifd(ITn)B)l o{c k (| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h r e| a group(groupd Idx.x), group(gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:u655p:)11,: note: | in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 60655: | note: field 'group' will be initialized after field 'stepSize' 562p | r i m s (ttiidd(-ttiidd)S,t anrtthRreedaudcse(,n tnhTrheraedasd)s,R etdiudcIen,B lnouclkl(ptthrr,e a&ddIidrxe.cxt)-,> ogurto,u pa(rggrso-u>ps)e,n d b| u ^~~~~~~~~~~f f, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :n562t:h15r:e awarning: dinitializer order does not match the declaration order [-Wreorder-ctor]s (nthreads), tidI n562B | l o c k (ttihdr(etaiddI)d,x .nxt)h,r egardosu(pn(tghrroeuapd)s,) , | t ^~~~~~~~~~~~~~~~~i dIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hB:l562o:c60k:( tnote: hfield 'group' will be initialized after field 'stepSize'r eadIdx .562x | ) , g rtoiudp((tgirdo)u,p )n,t h r| e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~a d s| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n threads )563, | t i d IsntBelpoScikz(et(hnrcecaldSIhdmxe.mx.)c,o mgmr.obuupf(fgSriozueps)[,N C C| L ^~~~~~~~~~~_ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx940. 67 warnings generated when compiling for gfx908. 67 warnings generated when compiling for gfx900. 67 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartRe/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:u562c:e15,: nwarning: Tinitializer order does not match the declaration order [-Wreorder-ctor]h readsReduce, nullp t562r | , & d itriedc(tt-i>do)u,t ,n tahrrgesa-d>ss(enndtbhurfefa,d sa)r,g st-i>drIencBvlboucfkf(,t h r| e ^a dIdx.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :g202:r53o:u pnote: (in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereg roup) ,202 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) RunWo r563k | E l e m esnttei(z)e.sr[uNnC(CwLe_)P;R O T| O ^_ SIMPLE]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp/:N8C:C1L:_ Snote: Tin instantiation of member function 'RunWork, 2, 2>::run' requested hereE PS/si z8e | oIfM(PTL)_)C O{L L _| F ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~U N C| ( group(groupA llReduce, COLLNET_DIREC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hT:,677 :S11I:M Pnote: Lin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereE , Max, i n677t | 6 4 _ t ) | ^ prims/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:t391i:d95-:t inote: dexpanded from macro 'IMPL_COLL_FUNC'S tartBcas t391, | n TRhurneWaodrskB,o utty,p ed,i rFeucntc-#>#ddoewvnr,e daorpgpsee>n,d bNuCfCfL,_ AaLrGgOs_-#>#raelcgvob,u fNfC,C L _| P ^R OTO_##pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hot:o202>:(53):. rnote: uin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren (&ncc l202S | h m e m . w o r kR)u;n W\o r k| E ^l ement/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h<:F562n:,15 :T ,note: field 'nthreads' will be initialized after field 'tidInBlock'R edOp, A562l | g o , Ptriodt(ot>i(d)).,r unnt(hwree)a;d s (| n ^t hreads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp :t7i:d1I:n Bnote: lin instantiation of member function 'RunWork, 2, 2>::run' requested hereo ck(th r7eadIdx.x) | ,I MgPrLo_uCpO(LgLr_ouFpU)N,C ( A| l ^~~~~~~~~~~~~~~~~l Red/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:c562e:,60 :C Onote: Lfield 'group' will be initialized after field 'stepSize'L NET_DI R562E | C T , StIiMdP(LtEi,d )M,a xn,t hurienatd3s2(_ntt)h r e| a^d s), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:d391I:n95B:l onote: cexpanded from macro 'IMPL_COLL_FUNC'k (threadI d391x | . x )R,u ngWroorukp<(ngcrcoluFpu)n,c # #| f ^~~~~~~~~~~u nc, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562C:O15L:L _warning: Finitializer order does not match the declaration order [-Wreorder-ctor]U NC(AllReduce, 562C | O L L N EtTi_dD(ItRiEdC)T,, nStIhMrPeLaEd,s (Mnatxh,r efaldosa)t,) t i| d^I nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for host. 67 warnings generated when compiling for gfx1102. 67 warnings generated when compiling for gfx90a. 67 warnings generated when compiling for gfx1101. 67 warnings generated when compiling for gfx1030. 67 warnings generated when compiling for gfx1100. 67 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h :| ^~~~~514 :9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), ntIn file included from h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppr:e1a: dIn file included from s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(:n10t: hIn file included from r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.he:a167d: s)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562t:i15d:I nwarning: Blinitializer order does not match the declaration order [-Wreorder-ctor]o ck(threadIdx.x), grou p562( | g r o u pt)i,d ( t| i ^~~~~~~~~~~~~~~~~d ), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:t562h:r60e:a dnote: sfield 'group' will be initialized after field 'stepSize'( nthrea d562s | ) , t itdiIdn(Btliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( t h| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e adIdx. x563) | , g r osutpe(pgSriozuep()n,c c l| S ^~~~~~~~~~~h mem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:d626):,9 :n tnote: hin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer eads(nth r626e | a d s ) , t i dpIrniBmlso(ctki(dt-htriedaSdtIadrxt.Sxc)a,t tgerro,u pn(Tghrroeuapd)s,S c a| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t e r| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) NULL, d i563r | e c t - >sutpe,p Sairzges(-n>cscelnSdhbmuefmf.,c oamrmg.sb-u>frfeScivzbeusf[fN,C C L| _ ^P ROTO_SIMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hL:E202]:/53N:C Cnote: Lin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here_ STEPS/ s202i | z e o f ( T ) ) R{u n W| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r k E| l group(groupe ment, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereg o, Prot o626> | ( ) . r u n ( w ep)r;i m s| ( ^t id-tidSta/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppr:t4S:c1a:t tnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested herer , nTh r4e | aIdMsPSLc_aCtOtLeLr_,F UNNUCL(LA,l ldRierdeuccte-,> uCpO,L LaNrEgTs_-D>IsReEnCdTb,u fSfI,M PaLrEg,s -P>rreeMcuvlbSuufmf,, i n| t ^8 _t) | ^/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202:53: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hnote: :in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here391 :95: note: expanded from macro 'IMPL_COLL_FUNC'202 | R391u | n W oRruknEWloermked(e)v.rreudno(pw| , ^ NCCL_AL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppG:O5_:#1#:a lnote: gin instantiation of member function 'RunWork, 2, 2>::run' requested hereo , NCC L5_ | PIRMOPTLO__C#O#LpLr_oFtUoN>C(()A.lrluRne(d&unccec,l SChOmLeLmN.EwTo_rDkI)R;E C\T , | S ^I MPLE, Pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:M562u:l15S:u mnote: ,field 'nthreads' will be initialized after field 'tidInBlock' uint8_ t562) | | ^ tid(ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:)391,: 95n:t hnote: rexpanded from macro 'IMPL_COLL_FUNC'e ads(nthre a391d | s ) ,R utniWdoIrnkB:,60 :N Cnote: Cfield 'group' will be initialized after field 'stepSize'L _ALGO_ #562# | a l g o ,t iNdC(CtLi_dP)R,O TnOt_h#r#epardost(on>t(h)r.eraudns()&,n ctcildSIhnmBelmo.cwko(rtkh)r;e a\d I d| x ^. x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:o562u:p15(:g rnote: ofield 'nthreads' will be initialized after field 'tidInBlock'u p), | ^~~~~~~~~~~562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562562 | : 15 : warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d(tid), nthre a562d | s ( n t htrieda(dtsi)d,) ,t indtIhnrBelaodcsk((ntthhrreeaaddIsd)x,. xt)i,d IgnrBoluopc(kg(rtohurpe)a,d I d| x ^~~~~~~~~~~ .x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::202562::5315:: note: warning: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereinitializer order does not match the declaration order [-Wreorder-ctor] 202 | 562R | u n W o rtkiEdl(etmiedn)t,< Fnnt,h rTe,a dRse(dnOtph,r eAaldgso),, PtriodtIon>B(l)o.crku(nt(hwree)a;d I d| x ^. x), group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp(:g5r:o1u:p )note: ,in instantiation of member function 'RunWork, 2, 2>::run' requested here | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)5 | IMPL_ C563O | L L _ F UsNtCe(pASlilzRee(dnucccel,S hCmOeLmL.NcEoTm_mD.IbRuEfCfTS,i zSeIsM[PNLCEC,L _PPrReOMTuOl_SSuImM,P LuEi]n/tN8C_CtL)_ S T| E^P S/sizeo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hf:(391T:)95): {note: expanded from macro 'IMPL_COLL_FUNC' | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 391 | RunWor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hk:<626n:c9c:l Fnote: uin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heren c##func ,626 | t y p e , F u npcr#i#mdse(vtriedd-otpit,S cNaCtCtLe_rA,L GnOT_h#r#eaaldgsoS,c aNtCtCeLr_,P RNOUTLOL_,# #dpirroetcot>-(>)u.pr,u na(r&gnsc-c>lsSehnmdebmu.fwfo,r ka)r;g s\- > r| e ^c vbuff, | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ^: 562:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here562 | t202i | d ( t i d ) , nRtuhnrWeoardksE(lnetmhernetax()),. rgurno(uwpe()g;r o u| p ^) , | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::5562::160:: note: note: in instantiation of member function 'RunWork, 2, 2>::run' requested herefield 'group' will be initialized after field 'stepSize' 5 | 562I | M P L _ CtOiLdL(_tFiUdN)C,( AnltlhRreedaudcse(,n tChOrLeLaNdEsT)_,D ItRiEdCITn,B lSoIcMkP(LtEh,r ePardeIMduxl.Sxu)m,, gurionutp8(_gtr)o u p| )^, | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hp:(562g:r15o:u pwarning: )initializer order does not match the declaration order [-Wreorder-ctor], | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsRe 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupC(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ (| A tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)l lReduce ,563 | C O L L NsEtTe_pDSIiRzEeC(Tn,c cSlISMhPmLeEm,. cPormemM.ubluSfufmS,i zienst[3N2C_CtL)_ P R| O^T O_SIMPLE]/NCCL_STEP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hS:/391s:i95z:e onote: fexpanded from macro 'IMPL_COLL_FUNC'( T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 391 | RunWork, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herec , type, F641u | n c # # d e v r e d oppri,d -NtCiCdLS_tAaLrGtOR_e#d#uacleg,o ,n TNhCrCeLa_dPsRORTeOd_u#c#ep,r odtior>e(c)t.-r>udno(w&nn,c c&ldSihrmeecmt.-w>oorukt),; a\r g s| - ^> sendbuff, args->r/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:c562v:b15u:f fnote: ,field 'nthreads' will be initialized after field 'tidInBlock' | ^ 562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h | : 202 : 53 :t inote: din instantiation of member function 'RunWorkElement, 2, 2>::run' requested here( tid), 202 | n t h r e a d s (RnutnhWroerakdEsl)e,m etnitdp(()g.rrouunp()w,e ) ;| ^~~~~~~~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp::605:: 1note: :field 'group' will be initialized after field 'stepSize' note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 5 | I MtPiLd_(CtOiLdL)_,F UnNtCh(rAelaldRse(dnutcher,e aCdOsL)L,N EtTi_dDIInRBElCoTc,k (StIhMrPeLaEd,I dPxr.exM)u,l Sgurmo,u upi(ngtr8o_utp)) , | ^| ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ duce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hNCCL_A:L562G:O15_:# #warning: alinitializer order does not match the declaration order [-Wreorder-ctor]g o, NCCL_PROTO_##proto>().r u562n | ( & n c ctliSdh(mteimd.)w,o rnkt)h;r e\a d s| ( ^n threads), tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:x562.:x15):, note: gfield 'nthreads' will be initialized after field 'tidInBlock'r oup(group), 562| | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t id(tid )563, | n t h rsetaedpsS(inzteh(rnecacdlsS)h,m etmi.dcIonmBml.obcukf(ftShirzeeasd[INdCxC.Lx_)P,R OgTrOo_uSpI(MgPrLoEu]p/)N,C C L| _ ^~~~~~~~~~~~~~~~~S TEP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:/562s:i60z:e onote: ffield 'group' will be initialized after field 'stepSize'( T)) { 562| | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(groupt id(tid), nthreads(nthreads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:d687I:n11B:l onote: cin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herek (thread I687d | x . x ) , g r o u pp(rgirmosu(pt)i,d - t| i ^~~~~~~~~~~d StartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_P_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ PL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidSta/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rtBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##pr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h 562: | 562 : 15 : twarning: iinitializer order does not match the declaration order [-Wreorder-ctor]d (tid), nthreads(nthre a562d | s ) , ttiiddI(ntBliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~( t h| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e adIdx.x )563, | g r o uspt(egprSoiuzpe)(,n c c| l ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~S h m| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)m .comm. b563u | f fS i z esst[eNpCSCiLz_eP(RnOcTcOl_SShImMePmL.Ec]o/mNmC.CbLu_fSfTSEiPzSe/ss[iNzCeCoLf_(PTR)O)T O{_ S| I ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~M P L| E group(group] /NCCL_STEPS/sizeof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h): 655{: 11 :| note: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here | group(group 655 | prims(tid-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:i655d:S11t:a rnote: tin instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereR educe, n655T | h r e a d s R e d u cper,i mnsu(ltlipdt-rt,i d&SdtiarretcRte-d>uocuet,, naTrhgrse-a>dsseRneddbuucfef,, naurlglsp-t>rr,e c&vdbiurfefc,t - >| o ^u t, args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:s202e:n53d:b unote: fin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heref , arg s202- | > r e c v b u f fR,u n W| o ^r kElement, 2, 2>::run' requested heree dOp, A202l | g o , P r o t oR>u(n)W.orruknE(lweem)e;n t , 2, 2>::run' requested hereo , Pro t7o | >I(M)P.Lr_uCnO(LwLe_)F;U N C| ( ^A llReduce/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp,: 7C:O1L:L Nnote: Ein instantiation of member function 'RunWork, 2, 2>::run' requested hereT _DIRE C7T | ,I MSPILM_PCLOEL,L _PFrUeNMCu(lASlulmR,e duuicnet,3 2C_OtL)L N E| T^_ DIRECT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 391S:I95M: Pnote: Lexpanded from macro 'IMPL_COLL_FUNC'E , PreMul S391u | m , RuuinnWto3r2k_n,c cNlCFCuLn_cA#L#GfOu_n#c#,a ltgyop,e ,N CFCuLn_cP#R#OdTeOv_r#e#dporpop(e)>.,r uNnC(C&Ln_cAcLlGSOh_m#e#ma.lwgoor,k )N;C C\L _ P| R ^O TO_##p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:o562t:o15>:( )note: .field 'nthreads' will be initialized after field 'tidInBlock'r un(&nc c562l | S h m e mt.iwdo(rtki)d;) ,\ n t| h ^r eads(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d snote: )field 'nthreads' will be initialized after field 'tidInBlock', tidIn B562l | o c k ( tthirde(atdiIdd)x,. xn)t,h rgeraodusp((ngtrhoruepa)d,s ) ,| ^~~~~~~~~~~~~~~~~t idI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:B562l:o60c:k (note: tfield 'group' will be initialized after field 'stepSize'h readId x562. | x ) , gtriodu(pt(igdr)o,u pn)t,h r e| a ^~~~~~~~~~~~~~~~~d s(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:t562h:r60e:a dnote: sfield 'group' will be initialized after field 'stepSize') , tidI n562B | l o c k (ttihdr(etaiddI)d,x .nxt)h,r egardosu(pn(tghrroeuapd)s,) , | t ^~~~~~~~~~~i dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h-:ti562d:S15t:a rwarning: tinitializer order does not match the declaration order [-Wreorder-ctor]B cast, nThread s562B | c a s t ,t i&dd(itriedc)t,- >notuhtr,e andusl(lnptthrr,e aadrsg)s,- >tsiednIdnbBulfofc,k (atrhgrse-a>drIedcxv.bxu)f,f ,g r o| u ^p (group),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~53 : | note: tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202563 | | s t e pRSuinzWeo(rnkcEclleSmhemnetm<.Fcno,m mT.,b uRfefdSOipz,e sA[lNgCoC,L _PPrRoOtToO>_(S)I.MrPuLnE(]w/eN)C;C L _| S ^T EPS/size/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppo:f7(:T1):) note: {in instantiation of member function 'RunWork, 2, 2>::run' requested here | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | 7 group(group | IMPL_COLL_FUNC(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hA:l677l:R11e:d unote: cin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heree , COLLNE T677_ | D I R E C T , S I MpPrLiEm,s (PtriedM-utliSduSmt,a rutiBncta3s2t_,t )n T h| r^e adsBca/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:t391,: 95&:d inote: rexpanded from macro 'IMPL_COLL_FUNC'e ct->out, 391d | i r eRcutn-W>odrokw#s#efnudnbcu,f ft,y paer,g sF-u>nrce#c#vdbeuvfrfe,d o p| < ^t ype>, NC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:L202_:A53L:G Onote: _in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here# #algo ,202 | N C C L _ P R O TROu_n#W#oprrkoEtloe>m(e)n.tr ().run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:w562e:)15;: note: | field 'nthreads' will be initialized after field 'tidInBlock' ^ 562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp | : 7 : 1 :t inote: din instantiation of member function 'RunWork, 2, 2>::run' requested here( tid), 7n | tIhMrPeLa_dCsO(LnLt_hFrUeNaCd(sA)l,l RteidduIcneB,l oCcOkL(LtNhErTe_aDdIIRdExC.Tx,) ,S IgMrPoLuEp,( gPrroeuMpu)l,S u m| , ^~~~~~~~~~~~~~~~~ uin/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:35622:_60t:) note: field 'group' will be initialized after field 'stepSize'| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h562: | 391 : 95 : tnote: iexpanded from macro 'IMPL_COLL_FUNC'd (tid), n t391h | r e aRdusn(Wnotrhkrp,) ,N C C| L ^~~~~~~~~~~_ ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Fn, T, RedOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h641::56211::15 :note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herewarning: initializer order does not match the declaration order [-Wreorder-ctor] 641 | p r562i | m s ( t itdi-dt(itdiSdt)a,r tnRtehdruecaed,s (nnTthhrreeaaddssR)e,d utcied,I ndBilroecckt(-t>hdroewand,I d&xd.ixr)e,c tg-r>oouupt(,g raorugps)-,> s e| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d b u| f tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)f , args -563> | r e c v bsutfefp,S i z| e ^( ncclShm/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:m202.:c53o:m mnote: .in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereb uffSi z202e | s [ N C C L _ P RROuTnOW_oSrIkMEPlLeEm]e/nNtC (| ) group(group. run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp::6559::111:: note: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herein instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | 655I | M P L _ C O L L _ F UpNrCi(mAsl(ltRiedd-utcied,S tCaOrLtLRNeEdTu_cDeI,R EnCTTh,r eSaIdMsPRLeEd,u cPer,e MnuullSlupmt,r ,u i&ndti6r4e_ctt)- > o| u^t , args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:s391e:n95d:b unote: fexpanded from macro 'IMPL_COLL_FUNC'f , args-> r391e | c v bRuufnfW,o r k| < ^n cclFunc#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h#:f202u:n53c:, note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herey pe, F u202n | c # # d e v r e dRoupnl,e mNeCnCtL<_FAnL,G OT_,# #RaeldgOop,, NAClCgLo_,P RPOrToOt_o#>#(p)r.ortuon>((w)e.)r;u n (| & ^n cclShmem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.:w9o:r1k:) ;note: in instantiation of member function 'RunWork, 2, 2>::run' requested here\ | ^ 9 | IMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562C:O15L:L _note: Ffield 'nthreads' will be initialized after field 'tidInBlock'U NC(All R562e | d u c e ,t iCdO(LtLiNdE)T,_ DnItRhErCeTa,d sS(InMtPhLrEe,a dPsr)e,M utliSduImn,B luoicnkt(6t4h_rte)a d I| d^x .x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:o391u:p95(:g rnote: oexpanded from macro 'IMPL_COLL_FUNC'u p), | ^~~~~~~~~~~~~~~~~ 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562R:u60n:W onote: rfield 'group' will be initialized after field 'stepSize'k t,i dNICnCBLl_oAcLkG(Ot_h#r#eaaldgIod,x .NxC)C,L _gPrRoOuTpO(_g#r#opurpo)t,o > (| ) ^~~~~~~~~~~. run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hou:p562):,15 : | warning: ^~~~~~~~~~~~~~~~~initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | 562 | t itdi(dt(itdi)d),, nntthhrreeaaddss((nntthhrreeaaddss)),, tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hhr:e562a:d15s:) ,warning: initializer order does not match the declaration order [-Wreorder-ctor]t idInBlock(thre a562d | I d x . xt)i,d (gtriodu)p,( gnrtohurpe)a,d s (| n ^~~~~~~~~~~t hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(Al/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ype, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBloc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hk:(t562h:r15e:a dwarning: Iinitializer order does not match the declaration order [-Wreorder-ctor]d x.x), group(g r562o | u p ) , t i| d ^~~~~~~~~~~( tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hwe); | : ^562 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1 :562 | note: in instantiation of member function 'RunWork, 2, 2>::run' requested here tid(ti d9) | ,I MnPtLh_rCeOaLdLs_(FnUtNhCr(eAaldlsR)e,d utcied,I nCBOlLoLcNkE(Tt_hDrIeRaEdCITd,x .SxI)M,P LgEr,o uPpr(egMruoluSpu)m,, u| i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n t 6| 4 tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)_ t) | ^ 563 | ste/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hp:S391i:z95e:( nnote: cexpanded from macro 'IMPL_COLL_FUNC'c lShmem.co m391m | . b uRfufnSWiozreks<[nNcCcClLF_uPnRcO#T#Of_uSnIcM,P LtEy]p/eN,C CFLu_nScT#E#PdSe/vsriezdeoopf<(tTy)p)e >{, N| C ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C L _| A group(groupL GO_##algo, NCCL_PROTO_##/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:r626o:t9o:> (note: )in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here. run(&nc c626l | S h m e m . w o rpkr)i;m s\( t i| d ^- tidStart/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:c562a:t15t:e rnote: ,field 'nthreads' will be initialized after field 'tidInBlock' nThreads S562c | a t t e rt,i dN(UtLiLd,) ,d inrtehcrte-a>dusp(,n tahrrgesa-d>ss)e,n dtbiudfIfn,B laorcgks(-t>hrreecavdbIudfxf.,x ) ,| ^g roup(grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hp:)202,: 53 :| ^~~~~~~~~~~~~~~~~note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 60202: | note: field 'group' will be initialized after field 'stepSize' R u562n | W o r k Etliedm(etnitd<)F,n ,n tTh,r eRaeddsO(pn,t hArlegaod,s )P,r ottiod>I(n)B.lroucnk((wteh)r;e a d| I ^d x.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppr:o10u:p1(:g rnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested hereu p), | 10 ^~~~~~~~~~~ | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ O_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.bu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:f562S:i15z:e swarning: [initializer order does not match the declaration order [-Wreorder-ctor]N CCL_PROTO_SIMPLE]/N C562C | L _ S T EtPiSd/(stiizde)o,f (nTt)h)r e{a d s| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n t h| r group(groupe ads), tidInBlock(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hh:r641e:a11d:I dnote: xin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here. x), grou p641( | g r o u p ) , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~p r i| m tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)s (tid-t i563d | S t a r tsRteedpuSciez,e (nnTchcrleSahdmseRme.dcuocmem,. bduifrfeScitz-e>sd[oNwCnC,L _&PdRiOrTeOc_tS-I>MoPuLtE,] /aNrCgCsL-_>SsTeEnPdSb/usfifz,e oafr(gTs)-)> r{e c v| b ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u f f| , group(group | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :677:11: 202note: | in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here R677u | n W o r k E l e m e nptrr(e)a.drsuBnc(awset),; & d| i ^r ect->ou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppt:,11 :d1i:r enote: cin instantiation of member function 'RunWork, 2, 2>::run' requested heret ->dow n11, | IaMrPgLs_-C>OsLeLn_dFbUuNfCf(,A lalrRgesd-u>cree,c vCbOuLfLfN,E T _| D ^I RECT, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hS:I202M:P53L:E ,note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereP reMul S202u | m , f l o a t )R u n| W^orkElement:(95):. rnote: uexpanded from macro 'IMPL_COLL_FUNC'n (we); | ^391 | RunW/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppo:r10k:<1n:c cnote: lin instantiation of member function 'RunWork, 2, 2>::run' requested hereF unc## f10u | nIcM,P Lt_yCpOeL,L _FFuUnNcC#(#AdlelvRreedduocpe<,t yCpOeL>L,N ENTC_CDLI_RAELCGTO,_ #S#IaMlPgLoE,, NPCrCeLM_uPlRSOuTmO,_ #h#aplrfo)t o >| (^) .run(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h&:n391c:c95l:S hnote: mexpanded from macro 'IMPL_COLL_FUNC'e m.work) ;391 | \ R| u ^n Workn,t hNrCeCaLd_sA)L,G Ot_i#d#IanlBgloo,c kN(CtChLr_ePaRdOITdOx_.#x#)p,r ogtroo>u(p)(.grruonu(p&)n,c c l| S ^~~~~~~~~~~~~~~~~h mem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h.:w562o:r60k:) ;note: field 'group' will be initialized after field 'stepSize'\ | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562t:i15d:( tnote: ifield 'nthreads' will be initialized after field 'tidInBlock'd ), nth r562e | a d s ( nttihdr(etaidds)),, nttihdrIenaBdlso(cnkt(htrheraedasd)I,d xt.ixd)I,n Bglroocukp((tghrroeuapd)I,d x .| x ^~~~~~~~~~~) , group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:s562(:n15t:h rwarning: einitializer order does not match the declaration order [-Wreorder-ctor]a ds), tidInBlock(th r562e | a d I d xt.ixd)(,t igdr)o,u pn(tghrroeuapd)s,( n t| h ^~~~~~~~~~~~~~~~~r ea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:s562):,60 tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ze(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/size/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ of(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.htepSize(:n562c:c15l:S hwarning: minitializer order does not match the declaration order [-Wreorder-ctor]e m.comm.buffSizes[NCCL_PRO T562O | _ S I M PtLiEd](/tNiCdC)L,_ SnTtEhPrSe/asdisz(enotfh(rTe)a)d s{) , | t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i d I| n group(groupB lock(threadIdx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h):,641 : 11| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | 641 | s t e p S i z e ( n cpcrliSmhsm(etmi.dc-otmimd.SbtuafrftSRiezdeusc[eN,C CnLT_hPrReOaTdOs_RSeIdMuPcLeE,] /dNiCrCeLc_tS-T>EdPoSw/ns,i z&edoifr(eTc)t)- >{o u t| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ a r| g group(groups ->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :note: 202in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: 53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 666 | 202 | p r i m s (RtuindW,o rnkTEhlreemaednstGAulpg,o ,N UPLrLo,t oa>r(g)s.-r>usne(nwdeb)u;f f ,| ^a rgs->recv/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppb:u10f:f1,: note: | in instantiation of member function 'RunWork, 2, 2>::run' requested here ^ 10 | IM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hP:L202_:C53O:L Lnote: _in instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereF UNC(A l202l | R e d u c e , CROuLnLWNoErTk_EDlIeRmEeCnTt,< FSnI,M PTL,E ,R ePdrOepM,u lASlugmo,, hParloft)o > (| )^. run(we)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h;: 391 :| 95 ^: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11: 1391: | note: in instantiation of member function 'RunWork, 2, 2>::run' requested hereR unWor k11< | nIcMcPlLF_uCnOcL#L#f_uFnUcN,C (tAylpleR,e dFuucnec,# #CdOeLvLrNeEdTo_pD,, SNICMCPLL_EA,L GPOr_e#M#uallSguom,, NfClCoLa_tP)R O T| O^_ ##proto/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:(391):.95r:u nnote: (expanded from macro 'IMPL_COLL_FUNC'& ncclShme m391. | w o rRku)n;W o\r k <| n ^c clFunc##f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:n562c:,15 :t ynote: pfield 'nthreads' will be initialized after field 'tidInBlock'e , Func# #562d | e v r e dtoipd<(ttyipde)>,, nNtChCrLe_aAdLsG(On_t#h#raelagdos,) ,N CtCiLd_IPnRBOlToOc_k#(#tphrroetaod>I(d)x..rxu)n,( &gnrcoculpS(hgmreomu.pw)o,r k )| ; ^~~~~~~~~~~~~~~~~ \ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^562 :60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562 :56215 | : note: field 'nthreads' will be initialized after field 'tidInBlock' tid(ti d562) | , n t htrieda(dtsi(dn)t,h rnetahdrse)a,d st(indtIhnrBelaodcsk)(,t htriedaIdnIBdlxo.cxk)(,t hgrreoaudpI(dgxr.oxu)p,) ,g r o| u ^~~~~~~~~~~p (group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nc##func, type, Func##devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hreads), :ti562d:I15n:B lwarning: ocinitializer order does not match the declaration order [-Wreorder-ctor]k (threadIdx.x), group( g562r | o u p ) ,t i d| ( ^~~~~~~~~~~t id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562| : ^15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | 562 | RtuindW(otrikdE)l,e mnetnhtr((t)h.rreuand(Iwdex).;x ) ,| ^g roup(gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppo:u12p:)1,: note: | in instantiation of member function 'RunWork, 2, 2>::run' requested here ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 12 | I563M | P L _ C OsLtLe_pFSUiNzCe((AnlclcRleSdhumceem,. cCoOmLmL.NbEuTf_fDSIiRzEeCsT[,N CSCILM_PPLREO,T OP_rSeIMMuPlLSEu]m/,N CdCoLu_bSlTeE)P S /| s^i zeof(T/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h):)391 :{95 : | note: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~expanded from macro 'IMPL_COLL_FUNC' | group(group 391 | RunWork, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herec , type, 626F | u n c # # d e v rperdiomps<(ttyipde->t,i dNSCtCaLr_tASLcGaOt_t#e#ra,l gnoT,h rNeCaCdLs_SPcaRtOtTeOr_,# #NpUrLoLt,o >d(i)r.ercutn-(>&unpc,c laSrhgmse-m>.sweonrdkb)u;f f\, a| r ^g s->re/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:v562b:u15f:f ,note: field 'nthreads' will be initialized after field 'tidInBlock' | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202 :t53i:d (note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herei d), n t202h | r e a d s ( n t hRruenaWdosr)k,E lteimdeInntBr(o)u.pr)u,n ( w| e ^~~~~~~~~~~~~~~~~) ; /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^562 :60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1 :562 | note: in instantiation of member function 'RunWork, 2, 2>::run' requested here tid( t13i | dI)M,P Ln_tChOrLeLa_dFsU(NnCt(hArlelaRdesd)u,c et,i dCIOnLBLlNoEcTk_(DtIhRrEeCaTd,I dSxI.MxP)L,E ,g rPoruepM(uglrSouump,) ,r c c| l ^~~~~~~~~~~_ bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h NC:C562L:_15P:R Owarning: TO_##protoinitializer order does not match the declaration order [-Wreorder-ctor]> ().run(&ncclShmem. w562o | r k ) ; t\i d (| t ^i d), nthreads(nthreads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:d562I:n15B:l onote: cfield 'nthreads' will be initialized after field 'tidInBlock'k (threadIdx.x), g r562o | u p ( g rtoiudp()t,i d )| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ n t| h tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r eads(n t563h | r e a d ss)t,e ptSiidzIen(BnlcocclkS(htmherme.acdoImdmx..bxu)f,f Sgirzoeusp[(NgCrCoLu_pP)R,O T O| _ ^~~~~~~~~~~~~~~~~S IMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:E562]:/60N:C Cnote: Lfield 'group' will be initialized after field 'stepSize'_ STEPS/ s562i | z e o f (tTi)d)( t{i d )| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ n t| h group(groupr eads(nthreads), ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:I677n:B11l:o cnote: kin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here( threadId x677. | x ) , g r o u p ( gprroiumps)(,t i d| - ^~~~~~~~~~~t idStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h 641 | : 562 : 15 : warning: pinitializer order does not match the declaration order [-Wreorder-ctor]r ims(tid-tidStartRed u562c | e , n Tthirde(atdisdR)e,d uncteh,r edaidrse(cntt-h>rdeoawdns,) ,& dtiirdeIcntB-l>oocukt(,t harregasd-I>dsxe.nxd)b,u fgfr,o uapr(ggsr-o>urpe)c,v b u| f ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~f , | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| ^ 563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202 : 53s:t enote: pin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereS ize( n202c | c l S h m e m . cRoumnmW.obrukfEflSeimzeenst[E(P)S./rsuinz(ewoef)(;T ) )| ^{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp group(group: 13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hC:O666L:L9_:F Unote: Nin instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC (AllRe d666u | c e , C O L L NpErTi_mDsI(RtEiCdT,, nSTIhMrPeLaEd,s GPartehMeurl,S udmi,r ercctc-l>_ubpf,l oNaUtL1L6,) a r| g^s ->sen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hd:b391u:f95f:, note: aexpanded from macro 'IMPL_COLL_FUNC'r gs->rec v391b | u f fR,u n W| o ^r k, 2, 2>::run' requested here, type ,202 | F u n c # # d e vRruendWoopre,n tNO(_)#.#rpurno(twoe>)(;) . r| u ^n (&nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppS:h12m:e1m:. wnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested herer k); \ 12 | | I ^M PL_CO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:L562_:F15U:N Cnote: (field 'nthreads' will be initialized after field 'tidInBlock'A llRedu c562e | , C O LtLiNdE(Tt_iDdI)R,E CnTt,h rSeIaMdPsL(En,t hPrreeaMdusl)S,u mt,i ddIonuBblloec)k ( t| h^r eadIdx/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h.:x391):,95 :g rnote: oexpanded from macro 'IMPL_COLL_FUNC'u p(group) ,391 | | ^~~~~~~~~~~~~~~~~R unW/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:r562k:<60n:c cnote: lfield 'group' will be initialized after field 'stepSize'F unc## f562u | n c , ttyipde(,t iFdu)n,c #n#tdherveraeddso(pnd,s )N,C CtLi_dAILnGBOl_o#c#ka(ltghor,e aNdCICdLx_.PxR)O,T Og_r#o#uppr(ogtroo>u(p)).,r u n| ( ^~~~~~~~~~~& ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBca/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ st, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:s562):,15 :t iwarning: dinitializer order does not match the declaration order [-Wreorder-ctor]I nBlock(threadI d562x | . x ) , tgirdo(utpi(dg)r,o unpt)h,r e a| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~s ( n| t tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)h reads) ,563 | t i d I nsBtleopcSki(zteh(rnecacdlISdhxm.exm).,c ogmrmo.ubpu(fgfrSoiuzpe)s,[ N C| C ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~L _ P| R tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)O TO_SIM P563L | E ] / N CsCtLe_pSSTiEzPeS(/nsciczleSohfm(eTm).)c o{m m .| b ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u f f| S group(groupi zes[NCCL_PROTO_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hI:M677P:L11E:] /note: Nin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC CL_STEP S677/ | s i z e o f ( T ) ) p{r i m| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( t i| d group(group- tidStartBcast,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :n677T:h11r:e anote: din instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heres Bcast, &677d | i r e c t - > o u t ,p rdiimrse(ctti-d>-dtoiwdnS,t aarrtgBsc-a>sste,n dnbTuhfrfe,a dasrBgcsa-s>tr,e c&vdbiurfefc,t - >| o ^u t, dir/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:c202t:-53>:d onote: win instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren , arg s202- | > s e n d b u f fR,u naWrogrsk-E>lreemcevnbtu, 2, 2>::run' requested herer oto>( )202. | r u n ( w e ) ; R u| n ^W orkElem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppe:n12t:<1F:n ,note: in instantiation of member function 'RunWork, 2, 2>::run' requested hereT , Red O12p | ,I MAPlLg_oC,O LPLr_oFtUoN>C(()A.lrluRne(dwuec)e;, C| O ^L LNET_DI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppR:E13C:T1,: Snote: Iin instantiation of member function 'RunWork, 2, 2>::run' requested hereM PLE, P13r | eIMMuPlLS_uCmO,L Ld_oFuUbNlCe()A l l| R^e duce,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :C391O:L95L:N Enote: Texpanded from macro 'IMPL_COLL_FUNC'_ DIRECT, 391S | I M PRLuEn,W oPrrke, NCCL _391A | L G OR_u#n#Waolrgko<,n cNcClCFLu_nPcR#O#TfOu_n#c#,p rtoytpoe>,( )F.urnucn#(#&dnecvcrleSdhompek,) ;N C\C L _| A ^L GO_##a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:g562o:,15 :N Cnote: Cfield 'nthreads' will be initialized after field 'tidInBlock'L _PROTO _562# | # p r o ttoi>d(()t.irdu)n,( &nntchcrleSahdmse(mn.twhorreka)d;s )\, t| i ^d InBlo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:k562(:t15h:r enote: afield 'nthreads' will be initialized after field 'tidInBlock'd Idx.x) ,562 | g r o u pt(igdr(otuipd)),, n| t ^~~~~~~~~~~~~~~~~h rea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:s562(:n60t:h rnote: efield 'group' will be initialized after field 'stepSize'a ds), t i562d | I n B l otcikd((tthirde)a,d Indtxh.rxe)a,d sg(rnotuhpr(egardosu)p,) ,t i d| I ^~~~~~~~~~~~~~~~~n Blo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:k562(:t60h:r enote: afield 'group' will be initialized after field 'stepSize'd Idx.x )562, | g r o utpi(dg(rtoiudp)),, n t| h ^~~~~~~~~~~r eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h53::562 :note: 15in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here: warning: initializer order does not match the declaration order [-Wreorder-ctor] 202 | Ru n562W | o r k E lteimde(nttii(d)I.nrBulno(cwke()t;h r e| a ^d Idx.x), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppg:r13o:u1p:( gnote: rin instantiation of member function 'RunWork, 2, 2>::run' requested hereo up), | 13 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | I M| P tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)L _COLL_ F563U | N C ( A lsltReepdSuiczee,( nCcOcLlLSNhEmTe_mD.IcRoEmCmT.,b uSfIfMSPiLzEe,s [PNrCeCMLu_lPSRuOmT,O _rScIcMlP_LbEf]l/oNaCtC1L6_)S T E| P^S /sizeof/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h(:T391):)95 :{ note: expanded from macro 'IMPL_COLL_FUNC'| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 391 | RunWork, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herey pe, Func #655# | d e v r e d o p < t ypprei>m,s (NtCiCdL-_tAiLdGSOt_a#r#taRlegdou,c eN,C CnLT_hPrReOaTdOs_R#e#dpurcoet,o >n(u)l.lrputnr(,& n&cdcilrSehcmte-m>.owuotr,k )a;r g\s - >| s ^e ndbuff, a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:g562s:-15>:r enote: cfield 'nthreads' will be initialized after field 'tidInBlock'v buff, | 562 ^ | tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:i202d:)53,: nnote: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereh reads (202n | t h r e a d s ) ,R utniWdoIrnkBElloecmke(ntth (| ) ^~~~~~~~~~~~~~~~~. run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:w562e:)60;: note: | field 'group' will be initialized after field 'stepSize' ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp : 13 :t1i:d (note: tin instantiation of member function 'RunWork, 2, 2>::run' requested herei d), nt h13r | eIaMdPsL(_nCtOhLrLe_aFdUsN)C,( AtlildRIendBulcoec,k (CtOhLrLeNaEdTI_dDxI.RxE)C,T ,g rSoIuMpP(LgEr,o uPpr)e,M u l| S ^~~~~~~~~~~u m, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : ^391 :95: note: expanded from macro 'IMPL_COLL_FUNC'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp :12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12391 | | I M PRLu_nCWOoLrLk_e,M uNlCSCuLm_,A LdGoOu_b#l#ea)l g o| ,^ NCCL_P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hR:O391T:O95_:# #note: pexpanded from macro 'IMPL_COLL_FUNC'r oto>().r u391n | ( & nRcucnlWSohrmke, NCC L562_ | A L G O _t#i#da(ltgiod,) ,N CnCtLh_rPeRaOdTsO(_n#t#hprreoatdos>)(,) .triudnI(n&BnlcocclkS(htmherme.awdoIrdkx).;x )\, g| r ^o up(gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:p562):,15 : | note: ^~~~~~~~~~~~~~~~~field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 60562: | note: field 'group' will be initialized after field 'stepSize' tid(t i562d | ) , n tthirde(atdisd()n,t hnrtehardesa)d,s (tnitdhIrneBaldosc)k,( tthirdeIandBIldoxc.kx()t,h rgeraoduIpd(xg.rxo)u,p )g,r o u| p ^~~~~~~~~~~~~~~~~( gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:p562):,60 : | note: ^~~~~~~~~~~field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::562202::1553:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | Ru n562W | o r k E lteimde(nttid(I)n.Brluonc(kw(et)h;r e a| d ^I dx.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppr:o13u:p1(:g rnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested hereu p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~13 | I| M tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)P L_COLL _563F | U N C ( AsltleRpeSdiuzcee(,n cCcOlLSLhNmEeTm_.DcIoRmEmC.Tb,u fSfISMiPzLeEs,[ NPCrCeLM_uPlRSOuTmO,_ SrIcMcPlL_Eb]f/lNoCaCtL1_6S)T E P| S^/ sizeof(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hT:)391): 95:{ note: expanded from macro 'IMPL_COLL_FUNC'| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 391 | RunWork, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heref unc, ty p655e | , F u n c # # d e vprreidmosp(i,d SNtCaCrLt_RAeLdGuOc_e#,# anlgToh,r eNaCdCsLR_ePdRuOcTeO,_ #n#uplrlopttor>,( )&.druinr(e&cntc-c>loSuhtm,e ma.rwgosr-k>)s;e n\d b u| f ^f , args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562c:v15b:u fnote: ffield 'nthreads' will be initialized after field 'tidInBlock', | ^ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :t202i:d53(:t inote: din instantiation of member function 'RunWorkElement, 2, 2>::run' requested here) , nth r202e | a d s ( n t h r eRaudnsW)o,r ktEildeImneBnltou(p)).,r u n| ( ^~~~~~~~~~~~~~~~~w e);/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : | ^ 562:60: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cppnote: :field 'group' will be initialized after field 'stepSize'13 :1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 13t | iIdM(PtLi_dC)O,L Ln_tFhUrNeCa(dAsl(lnRtehdruecaed,s )C,O LtLiNdEITnB_lDoIcRkE(CtTh,r eSaIdMIPdLxE.,x )P,r egMruoluSpu(mg,r orucpc)l,_ b f| l ^~~~~~~~~~~o at16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::562655::1511:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | p562r | i m s ( ttiidd-(ttiiddS)t,a rnttRherdeuacdes,( nntThhrreeaaddss)R,e dtuicdeI,n Bnluolclkp(ttrh,r e&addiIrdexc.tx-)>,o ugtr,o uapr(ggsr-o>uspe)n,d b u| f ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~f , | a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r gs->re c563v | b u f f ,s t e| p ^S ize(nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hS:h202m:e53m:. cnote: oin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herem m.buf f202S | i z e s [ N C C LR_uPnRWOoTrOk_ESlIeMmPeLnEt] (| ) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~. r u| n group(group( we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :note: 626in instantiation of member function 'RunWork, 2, 2>::run' requested here: 9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 13 | IMPL_ C626O | L L _ F U N C ( AplrliRmesd(utcied,- tCiOdLSLtNaErTt_SDcIaRtECtTe,r ,S InMTPhLrEe,a dPsrSecMautltSeurm,, NrUcLcLl,_ bdfilroeactt1-6>)u p ,| ^a rgs->s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:n391d:b95:u fnote: fexpanded from macro 'IMPL_COLL_FUNC', args-> r391 | e c vRbuunfWfo,r k <| n ^c clFunc#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h#:f202u:n53c:, note: tin instantiation of member function 'RunWorkElement, 2, 2>::run' requested herey pe, F u202n | c # # d e v r e dRoupnl,e mNeCnCtL<_FAnL,G OT_,# #RaeldgOop,, NAClCgLo_,P RPOrToOt_o#>#(p)r.ortuon>((w)e.)r;u n (| & ^n cclShmem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.:w13o:r1k:) ;note: in instantiation of member function 'RunWork, 2, 2>::run' requested here\ | ^ 13 | IMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562C:O15L:L _note: Ffield 'nthreads' will be initialized after field 'tidInBlock'U NC(All R562e | d u c e ,t iCdO(LtLiNdE)T,_ DnItRhErCeTa,d sS(InMtPhLrEe,a dPsr)e,M utliSduImn,B lroccckl(_tbhfrleoaadtI1d6x). x )| ,^ group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hg:r391o:u95p:) ,note: expanded from macro 'IMPL_COLL_FUNC' | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h: 562391: | 60 : Rnote: ufield 'group' will be initialized after field 'stepSize'n 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Work, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562 655: | 15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] prims(tid -562t | i d S t atid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rtReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx908. 67 warnings generated when compiling for gfx940. 67 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ck(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for host. 67 warnings generated when compiling for gfx90a. 67 warnings generated when compiling for gfx906. 67 warnings generated when compiling for gfx1030. 67 warnings generated when compiling for gfx1100. 67 warnings generated when compiling for gfx803. 67 warnings generated when compiling for gfx1101. 67 warnings generated when compiling for gfx900. 67 warnings generated when compiling for gfx1102. 67 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, intIn file included from 8_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppt:)1 : In file included from | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h^: 10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h167:: 391/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::95562:: 15note: :expanded from macro 'IMPL_COLL_FUNC' warning: initializer order does not match the declaration order [-Wreorder-ctor] 391 | RunWork <562n | c c l F utnicd#(#tfiudn)c,, nttyhpree,a dFsu(nnct#h#rdeeavdrse)d,o ptl,o cNkC(CtLh_rAeLaGdOI_d#x#.axl)g,o ,g rNoCuCpL(_gPrRoOuTpO)_,# # p| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o t o| > tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)( ).run( &563n | c c l S hsmteemp.Swiozrek()n;c c\l S h| m ^e m.com/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hm:.562b:u15f:f Snote: ifield 'nthreads' will be initialized after field 'tidInBlock'z es[NCC L562_ | P R O T Ot_iSdI(MtPiLdE)],/ NnCtChLr_eSaTdEsP(Sn/tshirzeeaodfs()T,) )t i{d I n| B ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l o c| k group(group( threadIdx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hp:(626g:r9o:u pnote: )in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h626: | 562 : 60 : note: field 'group' will be initialized after field 'stepSize' prim s562( | t i d - ttiiddS(ttairdt)S,c antttherre,a dnsT(hnrtehardesaSdcsa)t,t etri,d INnUBLlLo,c kd(itrherceta-d>Iudpx,. xa)r,g sg-r>osuepn(dgbruofufp,) ,a r g| s ^~~~~~~~~~~- >recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | pTrims(tiEdP-St/isdiSzteaorft(BTc)a)s t{, n| T ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~h r e| a group(groupd sBcast, &direct->out, nullptr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 677a:r11g:s -note: >in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heres endbuff, ar g677s | - > r e c v b u f f ,p r i| m ^s (tid-tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hS:t202a:r53t:B cnote: ain instantiation of member function 'RunWorkElement, 2, 2>::run' requested heres t, nT h202r | e a d s B c a s tR,u n&WdoirrkeEclte-m>eonutt<,F nd,i rTe,c tR-e>ddOopw,n ,A lagrog,s -P>rsoetnod>b(u)f.fr,u na(rwges)-;> r e| c ^v buff, | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp ^: 4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53 :4 | note: Iin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereM PL_COL L202_ | F U N C ( A l l RReudnuWcoer,k EClOeLmLeNnEtT<_FDnI,R ETC,T ,R eSdIOMpP,L EA,l gMoi,n ,P riontto8>_(t)). r u| n^( we); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : ^391 :95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: 391in instantiation of member function 'RunWork, 2, 2>::run' requested here | Run W4o | rIkMM,P LNEC,C LM_iAnL,G Oi_n#t#8a_ltg)o , | N^C CL_PROT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hO:_391#:#95p:r onote: texpanded from macro 'IMPL_COLL_FUNC'o >().run( &391n | c c lRSuhnmWeomr.kwt,i dN)C,C Ln_tAhLrGeOa_d#s#(anltghor,e aNdCsC)L,_ PtRiOdTIOn_B#l#opcrko(ttoh>r(e)a.drIudnx(.&xn)c,c lgSrhomuepm(.gwroorukp));, \ | ^~~~~~~~~~~~~~~~~| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :field 'group' will be initialized after field 'stepSize'562 :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | t i562d | ( t i d )t,i dn(tthirde)a,d sn(tnhtrheraedasd(sn)t,h rteiaddIsn)B,l otcikd(ItnhBrleoacdkI(dtxh.rxe)a,d Igdrxo.uxp)(,g rgoruopu)p,( g r| o ^~~~~~~~~~~u p), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&nc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:n562t:h15r:e awarning: dinitializer order does not match the declaration order [-Wreorder-ctor]s ), tidInBlock(t h562r | e a d I dtxi.dx()t,i dg)r,o unpt(hgrreoaudps)(,n t h| r ^~~~~~~~~~~e ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:t562i:d15-:t iwarning: dinitializer order does not match the declaration order [-Wreorder-ctor]S tartBcast, nT h562r | e a d s Btciads(tt,i d&)d,i rnetchtr-e>aodust(,n tdhirreeacdts-)>,d otwind,I naBrlgosc-k>(stehnrdebaudfIfd,x .axr)g,s -gr>oruepc(vgbruofufp,) , | ^| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202: 53563: | note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here step S202i | z e ( n c c l S hRmuenmW.ocrokmEml.ebmuefnftSC(L)_.SrTuEnP(Sw/es)i;z e o| f ^( T)) { | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: 4 :| 1 group(group: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hP:L677_:C11O:L Lnote: _in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereFU NC(AllRe d677u | c e , C O L L N E Tp_rDiImRsE(CtTi,d -StIiMdPSLtEa,r tMBicna,s ti,n tn8T_htr)e a d| s^B cast,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :&391d:i95r:e cnote: texpanded from macro 'IMPL_COLL_FUNC'- >out, di r391e | c t -R>udnoWwonr,k usnecn#d#bfuufnfc,, atrygpse-,> rFeucnvcb#u#fdfe,v r e| d ^o p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 202N:C53C:L _note: Ain instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereL GO_## a202l | g o , N C C L _RPuRnOWToOr_k#E#lpermoetnot><(F)n.,r uTn,( &RnecdcOlpS,h mAelmg.ow,o rPkr)o;t o\> ( )| . ^r un(we/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):;562 : 15| : ^ note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4: 1562: | note: in instantiation of member function 'RunWork, 2, 2>::run' requested here tid (4t | iIdM)P,L _nCtOhLrLe_aFdUsN(Cn(tAhlrleRaeddsu)c,e ,t iCdOILnLBNlEoTc_kD(IthRrEeCaTd,I dSxI.MxP)L,E ,g rMoiunp,( girnot8u_pt)), | | ^ ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::562391::6095:: note: note: field 'group' will be initialized after field 'stepSize'expanded from macro 'IMPL_COLL_FUNC' 562 | 391t | i d (RtuindW)o,r kn,, gNrCoCuLp_(AgLrGoOu_p#)#,a l g| o ^~~~~~~~~~~, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:[562N:C15C:L _warning: Pinitializer order does not match the declaration order [-Wreorder-ctor]R OTO_SIMPLE]/NC C562 | L _ S T EtPiSd/(stiizde)o,f (nTt)h)r e{a d s| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n t h| r group(groupe ads), tidInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:c626k:(9t:h rnote: ein instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herea dIdx.x) ,626 | g r o u p ( g r opurpi)m,s ( t| i ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d - t| i tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d StartS c563a | t t e r ,s tneTphSriezaed(snScccaltSthemre,m .NcUoLmLm,. bduifrfeScitz-e>su[pN,C CaLr_gPsR-O>TsOe_nSdIbMuPfLfE,] /aNrCgCsL-_>SrTeEcPvSb/usfifz,e o f| ( ^T )) { | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: 202 :| 53 group(group: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :R641u:11n:W onote: rin instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herek Element< F641n | , T , R e d O p ,p rAilmgso(,t iPdr-ottiod>S(t)a.rrtuRne(dwuec)e;, n| T ^h readsRed/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppu:c5e:,1 :d inote: rin instantiation of member function 'RunWork, 2, 2>::run' requested heree ct->d o5w | nI,M P&Ld_iCrOeLcLt_-F>UoNuCt(,A lalrRgesd-u>csee,n dCbOuLfLfN,E Ta_rDgIsR-E>CrTe,c vSbIuMfPfL,E , | M ^i n, uint8/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h_:t202): 53 :| ^note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202391 | : 95 : note: expanded from macro 'IMPL_COLL_FUNC' RunWor k391E | l e mReunntWF(u)n.cr#u#nd(ewver)e; d o| p ^< type>, N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppC:C5L:_1A:L Gnote: Oin instantiation of member function 'RunWork, 2, 2>::run' requested here_ ##alg o5, | INMCPCLL__CPORLOLT_OF_U#N#Cp(roto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 :g15r:o uwarning: pinitializer order does not match the declaration order [-Wreorder-ctor]( group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562562 | : 60 : note: tfield 'group' will be initialized after field 'stepSize'i d(tid) ,562 | n t h r etaidds((tnitdh)r,e andtsh)r,e atdisd(InntBhlroecakd(st)h,r etaiddIIdnxB.lxo)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u p| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)g roup), 563 | | ^~~~~~~~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ #devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h]:/562N:C15C:L _warning: Sinitializer order does not match the declaration order [-Wreorder-ctor]T EPS/sizeof(T)) 562{ | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ t i| d group(group( tid), nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:s677(:n11t:h rnote: ein instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herea ds), ti d677I | n B l o c k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)562 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor]563 | stepSize(ncclSh m562e | m . c o mtmi.db(utfifdS)i,z enst[hNrCeCaLd_sP(RnOtThOr_eSaIdMsP)L,E ]t/iNdCICnLB_lSoTcEkP(St/hsriezaedoIfd(xT.)x)) ,{ g r| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u p (| g group(groupr oup), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :687:11 :563 | note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here stepS i687z | e ( n c c l S h m e mp.rciommsm(.tbiudf-ftSiidzSetsa[rNtCBCcLa_sPtR,O TnOT_hSrIeMaPdLsEB]c/aNsCtC,L _&SdTiErPeSc/ts-i>zoeuotf,( Tn)u)l l{p t r| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ a r| g group(groups ->sendbuff, args->rec/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hv:b677u:f11f:, note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h677: | 202 : 53 : note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here p r202i | m s ( t i d - t iRduSntWaorrtkBEclaesmte,n tnootuot>,( )d.irruenc(tw-e>)d;o w n| , ^ args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpps:e5n:d1b:u fnote: fin instantiation of member function 'RunWork, 2, 2>::run' requested here, args -5> | rIeMcPvLb_uCfOfL,L _ F| U ^N C(AllR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:d202u:c53e:, note: Cin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereO LLNE T202_ | D I R E C T , SRIuMnPWLoEr,k EMlienm,e nuti().run (391w | e ) ;R u n| W ^o rk, 2, 2>::run' requested herec , typ e5, | IFMuPnLc_#CO#LdLe_vFrUeNdCo(pAu,c eN,C CCLO_LALLNGEOT__#D#IaRlEgCoT,, NSCICMLP_LPER,O TMOi_n#,# puriontto8>_(t)). r u| n^( &nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hS:h391m:e95m:. wnote: oexpanded from macro 'IMPL_COLL_FUNC'r k); \ | ^391 | Ru/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:W562o:r15k:< nnote: cfield 'nthreads' will be initialized after field 'tidInBlock'c lFunc# #562f | u n c , ttiydp(et,i dF)u,n cn#t#hdreevardesd(onpts,) ,N CtCiLd_IAnLBGlOo_c#k#(atlhgroe,a dNICdCxL._xP)R,O TgOr_o#u#pp(rgortoou>p()),. r u| n ^~~~~~~~~~~~~~~~~( &nc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:l562S:h60m:e mnote: .field 'group' will be initialized after field 'stepSize'w ork); 562\ | | ^ tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:d562):,15 :n tnote: hfield 'nthreads' will be initialized after field 'tidInBlock'r eads(n t562h | r e a d st)i,d (ttiiddI)n,B lnotchkr(etahdrse(andtIhdrxe.axd)s,) ,g rtoiudpI(ngBrlooucpk)(,t h r| e ^~~~~~~~~~~a dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :p15r:i mwarning: sinitializer order does not match the declaration order [-Wreorder-ctor]( tid-tidStartBc a562s | t , n Tthirde(atdisdB)c,a sntt,h r&edaidrse(cntt-h>roeuatd,s )n,u ltlipdtIrn,Bl oacrkg(st-h>rseeanddIbduxf.fx,) ,a rggrso-u>pr(egcrvobuupf)f,, | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h: 202563: | 53 : note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested heres tepSi z202e | ( n c c l S h m eRmu.ncWoomrmk.EbluefmfeSnitz_(S)T.ErPuSn/(swiez)e;o f (| T ^) ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp :| 5 group(group: 1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hM:P666L:_9C:O Lnote: Lin instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here_ FUNC(A l666l | R e d u c e , CpOrLiLmNsE(T_tDiIdR,E CnTT,h rSeIaMdPsLGEa,t hMeirn,, duiirnetc8t_-t>)u p ,| ^N ULL, ar/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hg:s391-:>95s:e nnote: dexpanded from macro 'IMPL_COLL_FUNC'b uff, arg s391- | > r eRcuvnbWuofrfk,< n c| c ^l Func##f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hu:n202c,: 53t:y pnote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested here, Func #202# | d e v r e d o p r,k ENlCeCmL_eAnLtGt(o)>.(r)u.nr(uwne()&;n c c| l ^S hmem.wo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppr:k5):;1 :\ note: in instantiation of member function 'RunWork, 2, 2>::run' requested here | ^ 5 | IMPL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hC:O562L:L15_:F Unote: Nfield 'nthreads' will be initialized after field 'tidInBlock'C (AllRed u562c | e , C OtLiLdN(EtTi_dD)I,R EnCtTh,r eSaIdMsP(LnEt,h rMeiand,s )u,i ntti8d_Itn)B l o| c^k (thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d391I:d95x:. xnote: )expanded from macro 'IMPL_COLL_FUNC', group(g r391o | u p )R,u n W| o ^~~~~~~~~~~~~~~~~r kn,t hNrCeCaLd_sA)L,G Ot_i#d#IanlBgloo,c kN(CtChLr_ePaRdOITdOx_.#x#)p,r ogtroo>u(p)(.grruonu(p&)n,c c l| S ^~~~~~~~~~~h mem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.homm.buff:S562i:z15e:s [warning: Ninitializer order does not match the declaration order [-Wreorder-ctor]C CL_PROTO_SIMPLE]/NCCL_ S562T | E P S / stiizde(otfi(dT)),) n{t h r| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a d s| ( group(groupn threads), tidInBlock(threadI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hd:x687.:x11):, note: gin instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herer oup(group) ,687 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) pri m563s | ( t i d -sttiedpSStiazret(BnccacsltS,h mneTmh.rceoamdms.BbcuafsftS,i z&edsi[rNeCcCtL-_>PoRuOtT,O _nSuIlMlPpLtEr],/ NaCrCgLs_-S>TsEePnSd/bsuifzfe,o fa(rTg)s)- >{r e c| v ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~b u f| f group(group, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9 :202 | note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here Ru n626W | o r k E l e m e nptrT(h)r.eraudns(Swcea)t;t e r| , ^ NULL, d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppi:r5e:c1t:- >note: uin instantiation of member function 'RunWork, 2, 2>::run' requested herep , arg s5- | >IsMePnLd_bCuOfLfL,_ FaUrNgCs(-A>lrleRcevdbuucfef,, C O| L ^L NET_DIRE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:T202,: 53S:I Mnote: Pin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereL E, Mi n202, | u i n t 8 _ t )R u n| W^o rkElem/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:n391t:<95F:n ,note: expanded from macro 'IMPL_COLL_FUNC'T , RedOp ,391 | A l gRou,n WPorroktc(c)l.Fruunnc(#w#ef)u;n c ,| ^t ype, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppF:u7n:c1#:# dnote: ein instantiation of member function 'RunWork, 2, 2>::run' requested herev redop <7t | yIpMeP>L,_ CNOCLCLL__FAULNGCO(_A#l#laRlegdou,c eN,C CCLO_LPLRNOETTO__D#I#RpErCoTt,o >S(I)M.PrLuEn,( &Mnicnc,l Suhimnetm3.2w_otr)k ) ;| ^\ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :expanded from macro 'IMPL_COLL_FUNC'562 :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 391 | Ru n562W | o r k < ntcicdl(Ftuindc)#,# fnutnhcr,e atdysp(en,t hFruenacd#s#)d,e vtrieddIonpBt,h rNeCaCdLI_dAxL.GxO), gro_u#p#(aglrgoou,p )N,C C L| _ ^~~~~~~~~~~~~~~~~P ROT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hO:_562#:#60p:r onote: tfield 'group' will be initialized after field 'stepSize'o >().ru n562( | & n c c ltSihdm(etmi.dw)o,r kn)t;h r\e a d| s ^( nthreads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 :t15i:d Inote: nfield 'nthreads' will be initialized after field 'tidInBlock'B lock(t h562r | e a d I dtxi.dx()t,i dg)r,o unpt(hgrreoaudps)(,n t h| r ^~~~~~~~~~~e ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElemen/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:<626F:n9,: Tnote: , in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereR edOp, Algo, Pro t626o | > ( ) . r u n ( wper)i;m s (| t ^i d-tidSt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppa:r6t:S1c:a tnote: tin instantiation of member function 'RunWork, 2, 2>::run' requested heree r, nT h6r | eIaMdPsLS_cCaOtLtLe_rF,U NNCU(LALl,l Rdeidrueccet,- >CuOpL,L NaErTg_sD-I>RsEeCnTd,b uSfIfM,P LaEr,g sM-i>nr,e civnbtu3f2f_,t ) | ^| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: 391in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here | RunW o202r | k < n c c l F u nRcu#n#WfournkcE,l etmyepnet,< FFnu,n cT#,# dReevdrOepd,o pAP,r oNtCoC>L(_)A.LrGuOn_(#w#ea)l;g o ,| ^N CCL_PROT/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppO:_7#:#1p:r onote: tin instantiation of member function 'RunWork, 2, 2>::run' requested hereo >().r u7 | nI(M&PnLc_cClOSLhLm_eFmU.NwCo(rAkl)l;R e\d u c| e ^, COLLN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hE:T562_:D15I:R Enote: Cfield 'nthreads' will be initialized after field 'tidInBlock'T , SIMP L562E | , M itni,d (utiindt)3,2 _ntt)h r e| a^d s(nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:d391s:)95,: tnote: iexpanded from macro 'IMPL_COLL_FUNC'd InBlock( t391h | r e aRduIndWxo.rxk)<,n cgcrloFuupn(cg#r#ofuupn)c,, t| y ^~~~~~~~~~~~~~~~~p e, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hF:u562n:c60#:# dnote: efield 'group' will be initialized after field 'stepSize'v redop< t562y | p e > , tNiCdC(Lt_iAdL)G,O _n#t#harlegaod,s (NnCtChLr_ePaRdOsT)O, _t#i#dpIrnoBtloo>c(k)(.trhurne(a&dIndcxc.lxS)h,m egmr.owuopr(kg)r;o u\p ) ,| ^ | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hg:r562o:u15p:) ,warning: initializer order does not match the declaration order [-Wreorder-ctor] | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nTh/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hreadsGat:h562e:r15,: dwarning: iinitializer order does not match the declaration order [-Wreorder-ctor]r ect->up, NULL, args->s e562n | d b u f ft,i da(rtgisd-)>,r enctvhbruefafd,s ( n| t ^h reads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :t202i:d53I:n Bnote: lin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hereo ck(th r202e | a d I d x . x ) ,R ugnrWoourpk(Eglreomuepn)t,< F n| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ T ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)R edOp, A563l | g o , PsrtoetpoS>i(z)e.(rnucnc(lwSeh)m;e m .| c ^o mm.buf/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppf:S7i:z1e:s [note: Nin instantiation of member function 'RunWork, 2, 2>::run' requested hereC CL_PR O7T | OI_MSPILM_PCLOEL]L/_NFCUCNLC_(SATlElPRSe/dsuiczee,o fC(OTL)L)N E{T _ D| I ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~R E C| T group(group, SIMPLE, Min, uint32_t) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :| 641^: 11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :391:95: note: expanded from macro 'IMPL_COLL_FUNC' 641 | 391 | RpurniWmosr(kt>,d oNwCnC,L _&AdLiGrOe_c#t#-a>loguot,, NaCrCgLs_-P>RsOeTnOd_b#u#fpfr,o taor>g(s)-.>rruenc(v&bnucfcfl,S h m| e ^m .work); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h\: 202 :| 53 ^: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562: 15202: | note: field 'nthreads' will be initialized after field 'tidInBlock' R u562n | W o r k Etliedm(etnitd<)F,n ,n tTh,r eRaeddsO(pn,t hArlegaod,s )P,r ottiod>I(n)B.lroucnk((wteh)r;e a d| I ^d x.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppr:o6u:p1(:g rnote: oin instantiation of member function 'RunWork, 2, 2>::run' requested hereu p), | 6 ^~~~~~~~~~~~~~~~~ | IMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562C:O60L:L _note: Ffield 'group' will be initialized after field 'stepSize'U NC(Al l562R | e d u c et,i dC(OtLiLdN)E,T _nDtIhRrEeCaTd,s (SnItMhPrLeEa,d sM)i,n ,t iidnItn3B2l_otc)k ( t| h^r eadId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hx:.391x:)95,: gnote: rexpanded from macro 'IMPL_COLL_FUNC'o up(grou p391) | , R| u ^~~~~~~~~~~n Work, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h t:i562d:(15t:i dwarning: )initializer order does not match the declaration order [-Wreorder-ctor], nthreads(nthreads), ti d562I | n B l o ctki(dt(htrieda)d,I dnxt.hxr)e,a dgsr(onutph(rgeraodusp)),, t i| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~I n B| l tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)o ck(t h563r | e a d I dsxt.exp)S,i zger(onucpc(lgSrhomuepm).,c o m| m ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~. b u| f tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)f Sizes[ N563C | C L _ P RsOtTeOp_SSiIzMeP(LnEc]c/lNSChCmLe_mS.TcEoPmSm/.sbiuzfefoSfi(zTe)s)[ N{C C L| _ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~P R O| T group(groupO _SIMPLE]/NCCL_STEPS/size/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:f687(:T11):) note: {in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 687 | prims(tid-t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hi:d677S:t11a:r tnote: Bin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herec ast, nTh r677e | a d s B c a s t , &pdriirmesc(tt-i>do-utti,d SntualrltpBtcra,s ta,r gnsT-h>rseeanddsbBucfafs,t ,a r&gdsi-r>ercetc-v>bouuftf,, d i| r ^e ct->down,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :a202r:g53s:- >note: sin instantiation of member function 'RunWorkElement, 2, 2>::run' requested heree ndbuf f202, | a r g s - > r eRcuvnbWuofrfk,E l e| m ^e nt, 2, 2>::run' requested here Algo, 202P | r o t o > ( ) . rRuunn(Wwoer)k;E l e| m ^e nt, 2, 2>::run' requested here Algo, 6P | rIoMtPoL>_(C)O.LrLu_nF(UwNeC)(;A l l| R ^e duce, CO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppL:L6N:E1T:_ Dnote: Iin instantiation of member function 'RunWork, 2, 2>::run' requested hereR ECT, S6I | MIPMLPEL,_ CMOiLnL,_ FiUnNtC3(2A_ltl)R e d| u^c e, COL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hL:N391E:T95_:D Inote: Rexpanded from macro 'IMPL_COLL_FUNC'E CT, SIM P391L | E , RMuinnW,o riknW,o rNkC#(d)e.vrruend(o&pnm,e mN.CwCoLr_kA)L;G O\_ # #| a ^l go, NCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h_:P562R:O15T:O _note: #field 'nthreads' will be initialized after field 'tidInBlock'# proto> (562) | . r u n (t&indc(ctliSdh)m,e mn.twhorreka)d;s (\n t h| r ^e ads), ti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:I562n:B15l:o cnote: kfield 'nthreads' will be initialized after field 'tidInBlock'( thread I562d | x . x ) ,t igdr(otuipd()g,r onutph)r,e a d| s ^~~~~~~~~~~~~~~~~( nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562a:d60s:) ,note: field 'group' will be initialized after field 'stepSize't idInB l562o | c k ( t htrieda(dtIiddx).,x )n,t hgrreoaudps((gnrtohurpe)a,d s )| , ^~~~~~~~~~~~~~~~~ tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:n562B:l60o:c knote: (field 'group' will be initialized after field 'stepSize't hreadI d562x | . x ) , tgirdo(utpi(dg)r,o unpt)h,r e a| d ^~~~~~~~~~~s (nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthrea d562s | ( n t h rteiadd(st)i,d )t,i dnItnhBrleoacdks((tnhtrheraedaIddsx).,x )t,i dgIrnoBulpo(cgkr(otuhpr)e,a d I| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~x . x| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), group (563g | r o u p )s,t e p| S ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~i z e| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n cclShm e563m | . c o m ms.tbeupfSfiSziez(ensc[cNlCSChLm_ePmR.OcToOm_mS.IbMuPfLfES]i/zNeCsC[LN_CSCTLE_PPSR/OsTiOz_eSoIfM(PTL)E)] /{N C C| L ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~_ S T| E group(groupP S/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 677 : 11 : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here prims(tid ,677 | n T h r e a d s G a tphreirm,s (dtiirde-ctti-d>Sutpa,r tNBUcLaLs,t ,a rngTsh-r>esaednsdBbcuafsft,, a&rdgisr-e>crte-c>vobuutf,f ,d i r| e ^c t->down, a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:g202s:-53>:s enote: nin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hered buff, 202a | r g s - > r e c vRbuunfWfo,r k E| l ^e ment, 2, 2>::run' requested herep , Alg o202, | P r o t o > ( )R.urnuWno(rwkeE)l;e m e| n ^t , 2, 2>::run' requested here Algo, 6P | rIoMtPoL>_(C)O.LrLu_nF(UweN)C;( A l| l ^R educe, C/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppO:L7L:N1E:T _note: Din instantiation of member function 'RunWork, 2, 2>::run' requested hereI RECT, 7S | IIMMPPLLE,_ CMOiLnL,_ FiUnNtC3(2A_ltl)R e d| u^c e, COLL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hN:E391T:_95D:I Rnote: Eexpanded from macro 'IMPL_COLL_FUNC'C T, SIMPL E391, | M iRnu,n Wuoirnkt<3n2c_ctl)F u n| c^# #func,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :t391y:p95e:, note: Fexpanded from macro 'IMPL_COLL_FUNC'u nc##devr e391d | o p rk,< nNcCcClLF_uAnLcG#O#_f#u#nacl,g ot,y pNeC,C LF_uPnRcO#T#Od_e#v#rperdootpo<>t(y)p.er>u,n (N&CnCcLc_lASLhGmOe_m#.#waolrgko),; N\C C L| _ ^P ROTO_##pro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:o562>:(15):. rnote: ufield 'nthreads' will be initialized after field 'tidInBlock'n (&nccl S562h | m e m . wtoirdk()t;i d\) , | n ^t hreads(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d snote: )field 'nthreads' will be initialized after field 'tidInBlock', tidIn B562l | o c k ( tthirde(atdiIdd)x,. xn)t,h rgeraodusp((ngtrhoruepa)d,s ) ,| ^~~~~~~~~~~~~~~~~t idI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:B562l:o60c:k (note: tfield 'group' will be initialized after field 'stepSize'h readId x562. | x ) , grtoiudp((tgirdo)u,p )n,t h r| e ^~~~~~~~~~~~~~~~~a ds(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:t562h:r60e:a dnote: s)field 'group' will be initialized after field 'stepSize', tidIn B562l | o c k ( tthirde(atdiIdd)x,. xn)t,h rgeraodusp((ngtrhoruepa)d,s ) ,| ^~~~~~~~~~~t idInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hn:c562c:l15S:h mwarning: einitializer order does not match the declaration order [-Wreorder-ctor]m .comm.buffSizes[N C562C | L _ P R OtTiOd_(StIiMdP)L,E ]n/tNhCrCeLa_dSsT(EnPtSh/rseiazdeso)f,( Tt)i)d I{n B l| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c k (| t group(grouph readIdx.x), gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:u687p:(11g:r onote: up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herethread Idx.x), group(gro u687p | ) , | ^~~~~~~~~~~ prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hreads), :t562i:d15I:n Bwarning: linitializer order does not match the declaration order [-Wreorder-ctor]o ck(threadIdx.x), group( g562r | o u p ) ,t i d| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t i d| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), nthreads(nthre a563d | s ) , tsitdeIpnSBilzoec(kn(ctchlrSehamdeImd.xc.oxm)m,. bgurfofuSpi(zgerso[uNpC)C,L _ P| R ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~O T O| _ tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S IMPLE] /563N | C C L _ SsTtEePpSS/isziez(enocfc(lTS)h)m e{m . c| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~m m .| b group(groupu ffSizes[NCCL_PROTO_SIMPLE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h]:/641N:C11C:L _note: Sin instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereT EPS/size o641f | ( T ) ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ p r| i group(groupm s(tid-tidStartReduce, n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hT:h666r:e9a:d snote: Rin instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heree duce, d666i | r e c t - > d o wpnr,i m&sd(itriedc,t -n>Tohurte,a dasrGgast-h>esre,n ddbiurfefc,t -a>rugps,- >NrUeLcLv,b uafrfg,s - >| s ^e ndbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:r202g:s53-:> rnote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested herec vbuff ,202 | | ^ RunW/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ho:r202k:E53l:e mnote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested heren t<(F)n.,r uTn,( wRee)d;O p ,| ^A lgo, Pro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppt:o10>:(1):. rnote: uin instantiation of member function 'RunWork, 2, 2>::run' requested heren (we); 10 | | I ^M PL_COLL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp_:F9U:N1C:( Anote: lin instantiation of member function 'RunWork, 2, 2>::run' requested herel Reduc e9, | ICMOPLLL_NCEOTL_LD_IFRUENCCT(,A lSlIRMePdLuEc,e ,M iCnO,L LhNaElTf_)D I R| E^C T, SIMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hL:E391,: 95M:i nnote: ,expanded from macro 'IMPL_COLL_FUNC' uint64_ t391) | | R^u nWorkn,c ,N CtCyLp_eA,L GFOu_n#c##a#ldgeov,r eNdCoCpL__,# #NpCrCoLt_oA>L(G)O._r#u#na(l&gnoc,c lNSChCmLe_mP.work);R O\T O _| # ^# proto>(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):.562r:u15n:( ¬e: nfield 'nthreads' will be initialized after field 'tidInBlock'c clShmem .562w | o r k ) ;t i\d ( t| i ^d ), nthre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562s:(15n:t hnote: rfield 'nthreads' will be initialized after field 'tidInBlock'e ads), t562i | d I n B ltoicdk((ttihdr)e,a dnItdhxr.exa)d,s (gnrtohurpe(agdrso)u,p )t,i d I| n ^~~~~~~~~~~~~~~~~B loc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hk:(562t:h60r:e anote: dfield 'group' will be initialized after field 'stepSize'I dx.x), 562g | r o u p (tgirdo(utpi)d,) , | n ^~~~~~~~~~~~~~~~~t hre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:d562s:(60n:t hnote: rfield 'group' will be initialized after field 'stepSize'e ads), t562i | d I n B ltoicdk((ttihdr)e,a dnItdhxr.exa)d,s (gnrtohurpe(agdrso)u,p )t,i d I| n ^~~~~~~~~~~B lock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllRedu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562562 | : 15 : warning: tinitializer order does not match the declaration order [-Wreorder-ctor]i d(tid), nthread s562( | n t h r etaidds()t,i dt)i,d InntBhlroecakd(st(hnrtehardeIaddxs.)x,) ,t igdrIonuBpl(ogcrko(utph)r,e a d| I ^~~~~~~~~~~d x.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, ar/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hgs:-562>:r15e:c vwarning: binitializer order does not match the declaration order [-Wreorder-ctor]u ff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h562: | 202 : 53 : tnote: iin instantiation of member function 'RunWorkElement, 2, 2>::run' requested hered (tid) ,202 | n t h r e a d s (RnutnhWroerakdEsl)e,m etnitdp(()g.rrouunp()w,e ) ;| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | ^| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp :56310 | : 1 : note: sin instantiation of member function 'RunWork, 2, 2>::run' requested heret epSiz e10( | nIcMcPlLS_hCmOeLmL._cFoUmNmC.(bAulflfRSeidzuecse[,N CCCOLL_LPNREOTT_OD_ISRIEMCPTL,E ]S/INMCPCLLE_,S TMEiPnS,/ shiazlefo)f ( T| )^) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391| : group(group95 : note: expanded from macro 'IMPL_COLL_FUNC' 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 677R:u11n:W onote: rin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herek t,, NnCTChLr_eAaLdGsOB_c#a#satl,g o&,d iNrCeCcLt_-P>RoOuTtO,_ #d#iprreoctto->>(d)o.wrnu,n (a&rngcsc-l>Sshemnedmb.uwfofr,k )a;r g\s - >| r ^e cvbuff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,: 562 :| 15 ^: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202: 53562: | note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here tid( t202i | d ) , n t h r eRaudnsW(onrtkhErleeamdesn)t,< Ftni,d ITn,B lRoecdkO(pt,h rAelagdoI,d xP.rxo)t,o >g(r)o.urpu(ng(rwoeu)p;) , | ^| ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp::6011:: 1note: :field 'group' will be initialized after field 'stepSize' note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 562 | 11 | I M PtLi_dC(OtLiLd_)F,U NnCt(hArlelaRdesd(uncteh,r eCaOdLsL)N,E Tt_iDdIIRnEBClTo,c kS(ItMhPrLeEa,d IMdixn.,x )f,l ogarto)u p (| g^r oup), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 391 ^~~~~~~~~~~: 95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562P:R15O:T Owarning: _initializer order does not match the declaration order [-Wreorder-ctor]S IMPLE]/NCCL_STE P562 | S / s i zteiodf((tTi)d)) ,{ n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groups (nthreads), tidI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hn:B626l:o9c:k (note: tin instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereh readIdx. x626) | , g r o u p ( gprroiumps)(,t i d| - ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t i d| S tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t artSca t563t | e r , nsTtherpeSaidzseS(cnactctleSrh,m eNmU.LcLo,m md.ibruefcftS-i>zueps,[ NaCrCgLs_-P>RsOeTnOd_bSuIfMfP,L Ea]r/gNsC-C>Lr_eScTvEbPufSf/,s i z| e ^o f(T)) {/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 202| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~53 : | note: group(groupin instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h : 677R:u11n:W onote: rin instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herek Element< F677n | , T , R e d O p ,p rAilmgso,( tPirdo-ttoi>d(S)t.arrutnB(cwaes);t , | n ^T hreadsB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppc:a11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested heres t, &d i11r | eIcMtP-L>_oCuOtL,L _dFiUNrCe(cAtl-l>Rdeodwunc,e ,a rCgOsL-L>NsEeTn_dDbIuRfEfC,T ,a rSgIsM-P>LrEe,c vMbiunf,f ,f l o| a ^t ) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h53::391 :note: 95in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here: note: expanded from macro 'IMPL_COLL_FUNC' 202 | 391 | R uRnuWnoWrokrEkle(d)o.pr),; N C| C ^L _ALGO_##/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppa:l11g:o1,: Nnote: Cin instantiation of member function 'RunWork, 2, 2>::run' requested hereC L_PRO T11O | _I#M#PpLr_oCtOoL>L(_)F.UrNuCn((A&lnlcRceldSuhcmee,m .CwOoLrLkN)E;T _\D I R| E ^C T, SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hP:L562E:,15: Mnote: ifield 'nthreads' will be initialized after field 'tidInBlock'n , floa t562) | | ^ tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:d391):,95 :n tnote: hexpanded from macro 'IMPL_COLL_FUNC'r eads(nt h391r | e a dRsu)n,W otrikd,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :N562C:C60L: _note: Afield 'group' will be initialized after field 'stepSize'L GO_##a l562g | o , N CtCiLd_(PtRiOdT)O,_ #n#tphrroetaod>s(()n.trhurne(a&dnsc)c,l SthimdeImn.Bwloorckk)(;t h\r e a| d ^I dx.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :g562r:o15u:p (note: gfield 'nthreads' will be initialized after field 'tidInBlock'r oup), 562| | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h687 | : 562 : 15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] prims(tid-t i562d | S t a r ttBicda(stti,d )n,T hnrtehardesaBdcsa(sntt,h r&edaidrse)c,t -t>ioduItn,B lnouclkl(ptthrr,e aadrIgdsx-.>xs)e,n dgbruofufp,( garrogusp-)>,r e c| v ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~b u f| f tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), | ^ 563 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hs:t202e:p53S:i znote: ein instantiation of member function 'RunWorkElement, 2, 2>::run' requested here( ncclS h202m | e m . c o m m . bRuufnfWSoirzkeEsl[eNmCeCnLt_i(z)e.orfu(nT()w)e ){; | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9 :10 | note: Iin instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereM PL_COL L666_ | F U N C ( A l l Rperdiumcse(,t iCdO,L LnNTEhTr_eDaIdRsEGCaTt,h eSrI,M PdLiEr,e cMti-n>,u ph,a lNfU)L L ,| ^a rgs->s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:n391d:b95u:f fnote: ,expanded from macro 'IMPL_COLL_FUNC' args->re c391v | b u fRfu,n W o| r ^k , 2, 2>::run' requested here, type ,202 | F u n c # # d e vRruendWoopre,n tNO(_)#.#rpurno(twoe>)(;) . r| u ^n (&ncclSh/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cppm:e12m:.1w:o rnote: kin instantiation of member function 'RunWork, 2, 2>::run' requested here) ; \ | 12 ^ | IMPL_COL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562F:U15N:C (note: Afield 'nthreads' will be initialized after field 'tidInBlock'l lReduc e562, | C O L LtNiEdT(_tDiIdR)E,C Tn,t hSrIeMaPdLsE(,n tMhirne,a ddso)u,b ltei)d I n| B^l ock(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hh:r391e:a95d:I dnote: xexpanded from macro 'IMPL_COLL_FUNC'. x), gro u391p | ( g rRouunpW)o,r k <| n ^~~~~~~~~~~~~~~~~c clF/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hu:n562c:#60#:f unote: nfield 'group' will be initialized after field 'stepSize'c , type ,562 | F u n c #t#idde(vtriedd)o,p a,d sN(CnCtLh_rAeLaGdOs_)#,# atligdoI,n BNlCoCcLk_(PtRhOrTeOa_d#I#dpxr.oxt)o,> (g)r.oruupn((g&rnocucpl)S,h m e| m ^~~~~~~~~~~. work); \ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h15: warning: initializer order does not match the declaration order [-Wreorder-ctor]: 562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), n t562h | r e a d st(indt(htrieda)d,s )n,t htriedaIdnsB(lnotchkr(etahdrse)a,d Itdixd.Ixn)B,l ogcrko(utph(rgeraoduIpd)x,. x )| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ g r| o tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)u p(grou p563) | , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~s t e| p tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)S ize(nc c563l | S h m e ms.tceopmSmi.zbeu(fnfcScilzSehsm[eNmC.CcLo_mPmR.ObTuOf_fSSIiMzPeLsE[]N/CNCCLC_LP_RSOTTEOP_SS/IsMiPzLeEo]f/(NTC)C)L _{S T E| P ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~S / s| i group(groupz eof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :641655 | : 11 : note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here pri m655s | ( t i d - t i d S t aprrtiRmesd(utcied,- tniTdhSrteaardtsRReedduuccee,, ndTihrreecatd-s>Rdeodwunc,e ,& dniurlelcptt-r>,o u&td,i raercgts-->>osuetn,d baurfgfs,- >asregnsd-b>urfefc,v baurfgfs,- > r| e ^c vbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h| : ^202 :53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202: 53202: | note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here R202u | n W o r k E l e mReunntWl(g)o.,r uPnr(owteo)>;( ) .| r ^u n(we); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp :| 10 ^: 1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10 :101 | :I Mnote: Pin instantiation of member function 'RunWork, 2, 2>::run' requested hereL _COL L10_ | FIUMNPCL(_AClOlLRLe_dFuUcNeC,( AClOlLRLeNdEuTc_eD,I RCEOCLTL,N ESTI_MDPILREE,C TM,i nS,I MhPaLlEf,) M i| n^, half) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :| 391^: 95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: 391expanded from macro 'IMPL_COLL_FUNC' | RunWor k391< | n c cRluFnuWnocr#k#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h#,:d 562eN:vC15rC:eL d_note: oAfield 'nthreads' will be initialized after field 'tidInBlock'pL a562,l | g No C, C LNt_CiACdLL(G_tOPi_Rd#O)#T,aO l_ng#to#h,pr reNoaCtdCosL>(_(nP)tR.hOrrTueOna_(d#&s#n)pc,rc olttSiohd>mI(en)mB..lrwouocnrk(k(&)tn;hc rc\el aS dh| Im ^de xm..xw)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho,:r 562kg:)r15;o: u \pnote: (field 'nthreads' will be initialized after field 'tidInBlock' g | r ^o u p562) | , /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :| 562 ^~~~~~~~~~~~~~~~~t: i15d:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h( :tnote: 562ifield 'nthreads' will be initialized after field 'tidInBlock':d 60):, note: nfield 'group' will be initialized after field 'stepSize'562t | h r e a562 d | ts i( dn (t thtirided)a(,dt sin)dt,)h ,rt einadtdIhsnr(Benlatodhcsrk(e(nattdhhsrr)ee,aa ddtIsid)dx,I. nxtB)il,do IcgnkrB(oltuohpcr(keg(artdohIurdpex)a.,dx I) d,| x ^~~~~~~~~~~~~~~~~.g xr)o/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h,u: p562g(:rg60or:uo punote: (pfield 'group' will be initialized after field 'stepSize'g) r,o u p562| ) | ^~~~~~~~~~~~~~~~~, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^~~~~~~~~~~t562 i:d60(:t inote: dfield 'group' will be initialized after field 'stepSize') , nthr e562a | d s ( n tthirde(atdisd)),, tnitdhIrneBaldosc(kn(tthhrreeaaddsI)d,x .txi)d,I ngBrlooucpk((gtrhoruepa)d,I d x| . ^~~~~~~~~~~x ), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15 391: | warning: initializer order does not match the declaration order [-Wreorder-ctor]R unWork,, NtCiCdLI_nABLlGoOc_k#(#tahlrgeoa,d INdCxC.Lx_)P,R OgTrOo_u#p#(pgrrootuop>)(,) . r| u ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n ( &| n tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) cclShme m563. | w o r k )s;t e\p S i| z ^e (nccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:h562m:e15m:. cnote: ofield 'nthreads' will be initialized after field 'tidInBlock'm m.buff S562i | z e s [ NtCiCdL(_tPiRdO)TO,_ nStIhMrPeLaEd]s/(NnCtChLr_eSaTdEsP)S,/ stiizdeIonfB(lTo)c)k ({t h r| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~a d I| d group(groupx .x), group(group), | ^~~~~~~~~~~~~~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h :687:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h11::562 :note: 60in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: note: field 'group' will be initialized after field 'stepSize' 687 | 562 | t i d ( tpirdi)m,s (nttihdr-etaiddsS(tnatrhtrBecaadsst),, ntTihdrIenaBdlsoBccka(stth,r e&addiIrdexc.tx-)>,o ugtr,o unpu(lglrpoturp,) ,a r g| s ^~~~~~~~~~~- >sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllRe/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ duce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::562391::1595:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]expanded from macro 'IMPL_COLL_FUNC' 391 | Run W562o | r k < n ctcildF(utnicd#)#,f unntch,r etaydpse(,n tFhurneca#d#sd)e,v rteiddoIpn(,t hNrCeCaLd_IAdLxG.Ox_)#,# aglrgoou,p (NgCrCoLu_pP)R,O T O| _ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~# # p| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)o to>(). r563u | n ( & n csctleSphSmiezme.(wnocrckl)S;h m\e m .| c ^o mm.bu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:f562S:i15z:e snote: [field 'nthreads' will be initialized after field 'tidInBlock'N CCL_PR O562T | O _ S I MtPiLdE(]t/iNdC)C,L _nStThErPeSa/dssi(znetohfr(eTa)d)s ){, t| i ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d I n| B group(groupl ock(threadIdx.x)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h,: 677g:r11o:u pnote: (in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereg roup), | 677 ^~~~~~~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 : 60 : note: pfield 'group' will be initialized after field 'stepSize'r ims(ti d562- | t i d S ttairdt(Btciads)t,, nntThhrreeaaddss(Bnctahsrte,a d&sd)i,r etcitd-I>noBulto,c kd(itrherceta-d>Iddoxw.nx,) ,a rggrso-u>ps(egnrdobuupf)f,, a| r ^~~~~~~~~~~g s->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx908. 67 warnings generated when compiling for gfx941. 67 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:626:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 626 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:641:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 641 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:655:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 655 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:666:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 666 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:677:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 677 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:687:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 687 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_DIRECT, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 67 warnings generated when compiling for gfx1030. 67 warnings generated when compiling for gfx906. 67 warnings generated when compiling for gfx1101. 67 warnings generated when compiling for gfx803. 67 warnings generated when compiling for gfx1102. 67 warnings generated when compiling for gfx900. 67 warnings generated when compiling for gfx1100. 67 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8 warnings generated when compiling for gfx908. 8 warnings generated when compiling for gfx940. 8 warnings generated when compiling for gfx1100. 8 warnings generated when compiling for gfx1101. 8 warnings generated when compiling for gfx941. 8 warnings generated when compiling for gfx1102. 8 warnings generated when compiling for gfx900. 8 warnings generated when compiling for gfx1030. 8 warnings generated when compiling for gfx906. 8 warnings generated when compiling for gfx803. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllToAllPivot, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8 warnings generated when compiling for host. 8 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^562 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | 562 | tRiudn(Wtoirdk)E,l enmtehnrtet(h)r.eraudnI(dwxe.)x;) , | g ^r oup(group)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp,: 10 :| 1 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: note: | in instantiation of member function 'RunWork, 3, 2>::run' requested here tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 10 | I563M | P L _ C OsLtLe_pFSUiNzCe((AnlclcRleSdhumceem,. cCoOmLmL.NbEuTf_fCSHiAzIeNs,[ NSCICMLP_LPER,O TSOu_mS,I MhPaLlEf])/ N C| C^L _STEPS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h/:s391i:z95e:o fnote: (expanded from macro 'IMPL_COLL_FUNC'T )) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 391 | | group(group RunWork, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here, Func# #916d | e v r e d o ppg,r oNuCpCTLi_dA,L GgOr_o#u#paNltghor,e aNdCsC,L _&PrReOcTvO,_ #&#spernodt,o >a(r)g.sr-u>ns(e&nndcbculfSfh,m eamr.gwso-r>kr)e;c v\b u f| f ^, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::562202::1553:: note: note: field 'nthreads' will be initialized after field 'tidInBlock'in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202562 | | t i d (RtuindW)o,r knEtlhermeeandts<(Fnnt,h rTe,a dRse)d,O pt,i dAIlngBol,o cPkr(otthor>e(a)d.Irduxn.(xw)e,) ;g r o| u ^p (group), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp :| 11 ^~~~~~~~~~~~~~~~~: 1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :in instantiation of member function 'RunWork, 3, 2>::run' requested here562 :60: note: field 'group' will be initialized after field 'stepSize'11 | IMPL_ C562O | L L _ F UtNiCd((AtlildR)e,d uncteh, rCeOaLdLsN(EnTt_hCrHeAaIdNs,) ,S ItMiPdLIEn,B lSoucmk,( tfhlroeaatd)I d x| .^x ), grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hp:(391g:r95o:u pnote: )expanded from macro 'IMPL_COLL_FUNC', | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:109:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 109 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Broadcast, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:109:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 109 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Broadcast, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ , flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInIn file included from B/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cppl:o1c: kIn file included from (/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.ht:h9r: eIn file included from a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hd:I167d: x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h.:x562):,15 :g rwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]u p(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8 warnings generated when compiling for gfx941. 8 warnings generated when compiling for gfx908. 8 warnings generated when compiling for gfx940. 8 warnings generated when compiling for gfx906. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx900. 8 warnings generated when compiling for gfx1030. 8 warnings generated when compiling for gfx1102. 8 warnings generated when compiling for gfx1101. 8 warnings generated when compiling for gfx803. 8 warnings generated when compiling for gfx90a. 8 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:9: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:53:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 53 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 95 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Broadcast, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8 warnings generated when compiling for host. 8 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, dIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ata2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h514: | 514 : 9 : iwarning: nvariable 'offset' set but not used [-Wunused-but-set-variable]t offset =514 | t i d ; i n| t ^ offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ RedOp, ProtoLL128>(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hea:d562s:)15,: twarning: iinitializer order does not match the declaration order [-Wreorder-ctor]d InBlock(threa d562I | d x . x )t,i dg(rtoiudp)(,g rnotuhpr)e,a d s| ( ^~~~~~~~~~~~~~~~~n th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562a:d60s:) ,note: field 'group' will be initialized after field 'stepSize't idInBl o562c | k ( t h rteiadd(Itdixd.)x,) ,n tghrroeuapd(sg(rnotuhpr)e,a d s| ) ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, t| i tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d InBlock (563t | h r e a dsItdexp.Sxi)z,e (gnrcoculpS(hgmreomu.pc)o,m m .| b ^~~~~~~~~~~u ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FU/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:c562l:S15h:m ewarning: minitializer order does not match the declaration order [-Wreorder-ctor]. work); \ | ^ 562 | tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:d562):,15 :n tnote: hfield 'nthreads' will be initialized after field 'tidInBlock'r eads(nthr e562a | d s ) , ttiidd(ItniBdl)o,c kn(tthhrreeaaddsI(dnxt.hxr)e,a dgsr)o,u pt(igdrIonuBpl)o,c k (| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d Idx.x) ,563 | g ro u p (gsrtoeuppS)i,z e (| n ^~~~~~~~~~~~~~~~~c clS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hh:m562e:m60.:c onote: mfield 'group' will be initialized after field 'stepSize'm .buffS i562z | e s [ N CtCiLd_(PtRiOdT)O,_ SnItMhPrLeEa]d/sN(CnCtLh_rSeTaEdPsS)/,s itziedoIfn(BTl)o)c k{( t h| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e a d| group(groupI dx.x), group(gr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ho:u916p:)7,: note: | in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here ^~~~~~~~~~~ 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, CO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hLLNET_C:H562A:I15N:, warning: Sinitializer order does not match the declaration order [-Wreorder-ctor]I MPLE, Max, half) | ^ 562 | tid(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hi:d391):,95 :n tnote: hexpanded from macro 'IMPL_COLL_FUNC'r eads(nthreads )391, | t iRduInnWBolrokc ,563 | N C C L _sAtLeGpOS_i#z#ea(lngcoc,l SNhCmCeLm_.PcRoOmTmO._b#u#fpfrSoitzoe>s([)N.CrCuLn_(P&RnOcTcOl_SShImMePmL.Ew]o/rNkC)C;L _\S T E| P ^S /sizeof(T)) { /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~562 : 15| : group(group note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.ht:i916d:)7,: nnote: tin instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested hereh reads( n916t | h r e a d s )p,r itmisd(IgnrBoluopcTki(dt,h rgeraoduIpdNxt.hxr)e,a dgsr,o u&pr(egcrvo,u p&)s,e n d| , ^~~~~~~~~~~~~~~~~ arg/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:-562>:s60e:n dnote: bfield 'group' will be initialized after field 'stepSize'u ff, ar g562s | - > r e ctvibdu(ftfi,d ) ,| ^n threads(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:h202r:e53a:d snote: )in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here, tidI n202B | l o c k ( t h r eRaudnIdWxo.rxk)E,l egmreonutp<(Fgnr,o uTp,) ,R e d| O ^~~~~~~~~~~p , Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:i562d:(15t:i dwarning: )initializer order does not match the declaration order [-Wreorder-ctor], nthreads(nthrea d562s | ) , t itdiIdn(Btliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~~~~~~~( th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:e562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:60:: 562note: :15field 'group' will be initialized after field 'stepSize': warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | 562 | t itdi(dt(itdi)d,) ,n tnhtrheraedasd(sn(tnhtrheraedasd)s,) ,t itdiIdnIBnlBolcokc(kt(htrheraedaIddIxd.xx.)x,) ,g rgoruopu(pg(rgoruopu)p,) , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~| ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx941. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threIn file included from a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cppd:I1d: xIn file included from ./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hx:)10,: In file included from g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hr:o167u: p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:g562r:o15u:p )warning: ,initializer order does not match the declaration order [-Wreorder-ctor] | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx940. 13 warnings generated when compiling for gfx941. 13 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 13 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1030. 13 warnings generated when compiling for gfx1101. 13 warnings generated when compiling for gfx803. 13 warnings generated when compiling for gfx1102. 13 warnings generated when compiling for gfx906. 13 warnings generated when compiling for gfx1100. 13 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx908. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx942. 7 warnings generated when compiling for host. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:94:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 94 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(Reduce, RING, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we )562; | | ^ tid(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cppt:i9:d1):, note: nin instantiation of member function 'RunWork, 3, 2>::run' requested heret hread s9( | nItMhPrLe_aCdOsL)L,_ FtUiNdCI(nABllloRcekd(utcher,e aCdOILdLxN.ExT)_,C HgArIoNu,p (SgIrMoPuLpE),, M i| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, u| i tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)n t64_t) 563 | | ^ ste/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hp:S391i:z95e:( nnote: cexpanded from macro 'IMPL_COLL_FUNC'c lShmem.c o391m | m . bRuufnfWSoirzke ,{ N C| C ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~L _ A| L group(groupG O_##algo, NCCL_PROTO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h_:#916#:p7r:o tnote: oin instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here> ().run (916& | n c c l S h mpermi.mwso(rgkr)o;u p\T i d| , ^ groupN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d snote: ,field 'nthreads' will be initialized after field 'tidInBlock' &recv, 562& | s e n d ,t iadr(gtsi-d>)s,e nndtbhurfefa,d sa(rngtsh-r>eraedcsv)b,u ftfi,d I n| B ^l ock(th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e202a:d53I:d xnote: .in instantiation of member function 'RunWorkElement, 3, 2>::run' requested herex ), gr o202u | p ( g r o u p ) ,R u n| W ^~~~~~~~~~~~~~~~~o rkE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:e562m:e60n:t t(h)r.eraudns((wnet)h;r e a| d ^s ), tidI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cppn:B11l:o1c:k (note: tin instantiation of member function 'RunWork, 3, 2>::run' requested hereh readI d11x | .IxM)P,L _gCrOoLuLp_(FgUrNoCu(pA)l,l R e| d ^~~~~~~~~~~u ce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp::11: : In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::1010: : In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h::168168: : /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h::153153::1414:: warning: warning: unused variable 'data1' [-Wunused-variable]unused variable 'data1' [-Wunused-variable] 153153 | | uuiinntt3322__tt ddaattaa11,, ffllaagg11,, ddaattaa22,, ffllaagg22;; | | ^~~~~ ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h::153153::2121:: warning: warning: unused variable 'flag1' [-Wunused-variable]unused variable 'flag1' [-Wunused-variable] 153153 | | uuiinntt3322__tt ddaattaa11,, ffllaagg11,, ddaattaa22,, ffllaagg22;; | | ^~~~~ ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h::153153::2828:: warning: warning: unused variable 'data2' [-Wunused-variable]unused variable 'data2' [-Wunused-variable] 153153 | | uuiinntt3322__tt ddaattaa11,, ffllaagg11,, ddaattaa22,, ffllaagg22;; | | ^~~~~ ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h::153153::3535:: warning: warning: unused variable 'flag2' [-Wunused-variable]unused variable 'flag2' [-Wunused-variable] 153153 | | uuiinntt3322__tt ddaattaa11,, ffllaagg11,, ddaattaa22,, ffllaagg22;; | | ^~~~~ ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h warning: :initializer order does not match the declaration order [-Wreorder-ctor]562 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562562 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563563 | | sstteeppSSiizzee((nnccccllSShhmmeemm..ccoommmm..bbuuffffSSiizzeess[[NNCCCCLL__PPRROOTTOO__SSIIMMPPLLEE]]//NNCCCCLL__SSTTEEPPSS//ssiizzeeooff((TT)))) {{ | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | | group(group group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h::916916::77:: note: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested herein instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916916 | | pprriimmss((ggrroouuppTTiidd,, ggrroouuppNNtthhrreeaaddss,, &&rreeccvv,, &&sseenndd,, aarrggss-->>sseennddbbuuffff,, aarrggss-->>rreeccvvbbuuffff,, | | ^ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::202202::5353:: note: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested herein instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202202 | | RRuunnWWoorrkkEElleemmeenntt<>(())..rruunn((wwee));; | | ^ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp4::51::1 :note: in instantiation of member function 'RunWork, 3, 2>::run' requested herenote: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | 5I | MIPMLP_LC_OCLOLL_LF_UFNUCN(CA(lAllRleRdeudcuec,e ,C OCLOLLNLENTE_TC_HCAHIANI,N ,S ISMIPMLPEL,E ,P rPerMeuMluSluSmu,m ,i nuti8n_tt8)_ t )| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::95391:: 95note: :expanded from macro 'IMPL_COLL_FUNC' note: expanded from macro 'IMPL_COLL_FUNC' 391 | 391 | R u nRWuonrWkop,e >N,C CNLC_CALL_GAOL_G#O#_a#l#gaol,g oN,C CNLC_CPLR_OPTROO_T#O#_p#r#optroo>t(o)>.(r)u.nr(u&nn(c&cnlcSchlmSehmm.ewmo.rwko)r;k )\; \| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :note: 562field 'nthreads' will be initialized after field 'tidInBlock': 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | 562t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atdisd)I,n BtliodcIkn(Btlhorceka(dtIhdrxe.axd)I,d xg.rxo)u,p (ggrroouupp()g,r o u| p ^~~~~~~~~~~~~~~~~) , | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h ^~~~~~~~~~~~~~~~~: 562:60/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:: 562note: :field 'group' will be initialized after field 'stepSize'60 : note: field 'group' will be initialized after field 'stepSize' 562 | t562i | d ( t i dt)i,d (nttihdr)e,a dnst(hnrtehardesa(dnst)h,r etaiddsI)n,B ltoicdkI(ntBhlroecakd(Itdhxr.exa)d,I dgxr.oxu)p,( ggrroouupp)(,g r o| u ^~~~~~~~~~~p ), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tiIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &re/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ um, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ A562L | G O _ # #taildg(ot,i dN)C,C Ln_tPhRrOeTaOd_#s#(pnrtohtroe>a(d)s.)r,u nt(i&dnIcncBllSohcmekm(.twhorreka)d;I d\x . x| ) ^, group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15 :563/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : | note: 562 field 'nthreads' will be initialized after field 'tidInBlock': 15 : swarning: tinitializer order does not match the declaration order [-Wreorder-ctor]e p S562i | z e ( n562 c | tc il dS (h tmtieidmd).(,ct oinmdtm)h.,rb eunaftdfhsSr(ienzatedhssr[(eNnaCtdChsLr)_e,Pa RdtOsiT)dO,I_ nStBIilMdoPIcLnkEB(]lt/ohNcrCkeC(aLtd_hISrdTexEa.PdxSI)/d,sx i.gzxre)oo,uf p(g(Trg)or)uo pu{(p g) r,| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u p| ) ^~~~~~~~~~~~~~~~~| , group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~562 : 60| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) note: field 'group' will be initialized after field 'stepSize' 563 | 562 | s t etpiSdi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h(z:te916i(:dn7)c:,c lnote: nSin instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested hereth hmreema.d cs916o( | mn mt .h br ue fa fdpSsri)iz,me sst([igNdrCIoCnuLBp_lTPoiRcdOk,T( Otg_hrSroIeuMapPdNLItEdh]xr/.eNxaC)dC,sL ,_g Sr&TorEuePpcS(v/g,sr io&zusepeo)nf,d( ,T )| a) ^~~~~~~~~~~r g{s - >| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e n d| group(groupb uff, args->recvbu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.hf:f916,: 7 :| ^note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53 :916 | note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here p r202i | m s ( g r o u p TRiudn,W ogrrkoEulpeNmtehnrteos>e(n)d.bruufnf(,w ea)r;g s -| > ^r ecvbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp :| 13 ^: 1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :202:53: note: 13in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here | IMPL_ C202O | L L _ F U N C ( ARlulnRWeodrukcEel,e mCeOnLtLu(m),. rrucnc(lw_eb)f;l o a| t ^1 6) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :391:95: note: 13expanded from macro 'IMPL_COLL_FUNC' | IMPL_COL L391_ | F U NRCu(nAWlolrRkec,l _NbCfClLo_aAtL1G6O)_ # #| a^l go, N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:C391L:_95P:R Onote: Texpanded from macro 'IMPL_COLL_FUNC'O _##proto >391( | ) . rRuunn(W&onrckc, 562N | C C L _ AtLiGdO(_t#i#da)l,g on,t hNrCeCaLd_sP(RnOtThOr_e#a#dpsr)o,t ot>i(d)I.nrBulno(c&kn(ctchlrSehamdeImd.xw.oxr)k,) ;g r\o u p| ( ^g roup/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 : 15| : ^~~~~~~~~~~~~~~~~ note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: 562note: | field 'group' will be initialized after field 'stepSize' tid (562t | i d ) , tnitdh(rteiadd)s,( nnthtrheraedasd)s,( nttihdrIenaBdlso)c,k (ttihdrIenaBdlIodcxk.(xt)h,r egardoIudpx(.gxr)o,u pg)r,o u p| ( ^~~~~~~~~~~~~~~~~g rou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hp:)562,: 60 :| ^~~~~~~~~~~note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/all_reduce.h:916:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 916 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | IMPL_COLL_FUNC(AllReduce, COLLNET_CHAIN, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] 563 | stepSize(n c562c | l S h m etmi.dc(otmim.db)u,f fnStihzreesa[dNsC(CnLt_hPrReOaTOd_sS)I,M PtLiEd]I/nNBClCoLc_kST(EtPhSr/esaidzIedoxf.(xT)),) g{r o u| p ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~( g r| o group(groupu p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h: 34563: | 7 : note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested heres tepSize(n c34c | l S h m e m .pcroimmms.(btuifdf,S inztehsr[eNaCdCsL,_ P&RrOiTnOg_-S>IpMrPeLvE,] /&NrCiCnLg_-S>TnEePxSt/,s iazregosf-(>Ts)e)n d{b u f| f ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, a| r group(groupg s->recvbuff, args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h>:r34e:d7O:p Anote: rin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereg , 0, args -34> | c o n n I n dperxi,m sa(rtgisd-,> cnotnhnrIenaddesx,) ;& r i| n ^g /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h-:>80p:r5e:v ,note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here& rin g80- | > n e x tr,u naRrignsg-<>Ts,e nRdebduOfpf,, Parrogtso->>(raercgvsb)u;f f ,| ^a rgs->red/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hO:p202A:r53g:, note: 0in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here, args -202> | c o n n I n d e xR,u nWaorrgksE-l>ecmoennntI, ProtoSimple<1, 1>>' requested heret o>() .80r | u n ( w e)r;u n R| i ^n g, 1, 2>::run' requested hereo >(ar g6s | )I;M P L| _ ^C OLL_FUN/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:(202R:e53d:u cnote: ein instantiation of member function 'RunWorkElement, 1, 2>::run' requested here, RING ,202 | S I M P L E , SRuumnPWoosrtkDEilve,m einntt<3F2n_,t )T , | R^e dOp, A/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hl:g391o:,95 :P rnote: oexpanded from macro 'IMPL_COLL_FUNC't o>().run (391w | e ) ;R u n| W ^o rk, 1, 2>::run' requested heren c, ty p7e | ,I MFPuLn_cC#O#LdLe_vFrUeNdCo(pRe,, NRCCILN_GA,L GSOI_M#P#LaEl,g oS,u mNPCoCsLt_DPiRvO,T Ou_i#n#tp3r2o_tto)> ( )| .^r un(&nc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hc:l391S:h95m:e mnote: .expanded from macro 'IMPL_COLL_FUNC'w ork); \ 391| | ^ RunWo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:k562<:n15c: cnote: lfield 'nthreads' will be initialized after field 'tidInBlock'F unc##f u562n | c , t ytpied,( tFiudn)c,# #ndtehvrreeaddosp(a,d sN)C,C Lt_iAdLIGnOB_l#o#cakl(gtoh,r eNaCdCILd_xP.RxO)T,O _g#r#opurpo(tgor>o(u)p.)r,u n (| & ^~~~~~~~~~~~~~~~~n ccl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:h562m:e60m:. wnote: ofield 'group' will be initialized after field 'stepSize'r k); \ 562| | ^ tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:t562i:d15):, note: nfield 'nthreads' will be initialized after field 'tidInBlock't hreads (562n | t h r e atdisd)(,t itdi)d,I nnBtlhorceka(dtsh(rnetahdrIedaxd.sx)),, tgirdoIunpB(lgorcoku(pt)h,r e a| d ^~~~~~~~~~~I dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx940. 13 warnings generated when compiling for gfx908. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx900. 13 warnings generated when compiling for gfx906. 13 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 13 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 13 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1102. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx1030. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for host. 13 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NG, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWorkt,i dN(CtCiLd_)A,L GnOt_h#r#eaaldgso(,n tNhCrCeLa_dPsR)O,T Ot_i#d#IpnrBoltooc>k(()t.hrruena(d&Indcxc.lxS)h,m egmr.owuopr(kg)r;o u\p ) ,| ^ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T): 562:15: note: field 'nthreads' will be initialized after field 'tidInBlock'563 | s t562e | p S i z et(indc(ctliSdh)m,e mn.tchormema.dbsu(fnftShirzeeasd[sN)C,C Lt_iPdRIOnTBOl_oScIkM(PtLhEr]e/aNdCICdLx_.SxT)E,P Sg/rsoiuzpe(ogfr(oTu)p)) ,{ | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h| : group(group562 :60: note: field 'group' will be initialized after field 'stepSize' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h :t34i:d7(:t inote: din instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here) , nthread s34( | n t h r e a dpsr)i,m st(itdiIdn,B lnotchkr(etahdrse,a d&Irdixn.gx-)>,p rgervo,u p&(rgirnogu-p>)n,e x t| , ^~~~~~~~~~~ args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:_562A:L15G:O _warning: #initializer order does not match the declaration order [-Wreorder-ctor]# algo, NCCL_PROTO _562# | # p r o ttoi>d(()t.irdu)n,( &nntchcrleSahdmse(mn.twhorreka)d;s )\, t| i ^d InBloc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hk:(562t:h15r:e anote: dfield 'nthreads' will be initialized after field 'tidInBlock'I dx.x) ,562 | g r o u pt(igdr(otuipd)),, n| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d s(nthr e563a | d s ) , sttiedpISniBzleo(cnkc(ctlhSrhemaedmI.dcxo.mxm).,b ugfrfoSuipz(egsr[oNuCpC)L,_ P R| O ^~~~~~~~~~~~~~~~~T O_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hI:M562P:L60E:] /note: Nfield 'group' will be initialized after field 'stepSize'C CL_ST E562P | S / s i zteiodf((tTi)d)) ,{ n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groups (nthreads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h :t34i:d7I:n Bnote: lin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereo ck(thread I34d | x . x ) , gprroiumps((gtriodu,p )n,t h r| e ^~~~~~~~~~~a ds, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buff/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:i562z:e15s:[ Nwarning: Cinitializer order does not match the declaration order [-Wreorder-ctor]C L_PROTO_SIMPLE]/ N562C | C L _ S TtEiPdS(/tsiidz)e,o fn(tTh)r)e a{d s (| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t h r| e group(groupa ds), tidInBlock/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h(:t34h:r7e:a dnote: Iin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hered x.x), group(gr oup), 34 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) prims(tid, nthr e563a | d s , &srtienpgS-i>zper(envc,c l&Srhimnegm-.>cnoemxmt.,b uafrfgSsi-z>esse[nNdCbCuLf_fP,R OaTrOg_sS-I>MrPeLcEv]b/uNfCfC,L _aSrTgEsP-S>/rseidzOepoAfr(gT,) )0 ,{ a r| g ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~s - >| c group(groupo nnIndex, args->connIndex); | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h ^: 34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h : 80 : 5p:r inote: min instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested heres (tid, n t80h | r e a d sr,u n&Rriinngg<-T>,p rReevd,O p&,r iPnrgo-t>on>e(xatr,g sa)r;g s -| > ^s endbuff, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ha:r202g:s53-:> rnote: ein instantiation of member function 'RunWorkElement, 1, 2>::run' requested herec vbuff, 202a | r g s - > r e d ORpuAnrWgo,r k0E,l eamregnst-<>Fcno,n nTI,n dReexd,O pa,r gAsl-g>oc,o nPnrIontdoe>x());. r u| n ^( we); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h| : ^80 :5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11 :801 | : note: in instantiation of member function 'RunWork, 1, 2>::run' requested here runR i11n | gId(uacreg,s )R;I N G| , ^ SIMPLE, S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hu:m202,: 53f:l onote: ain instantiation of member function 'RunWorkElement, 1, 2>::run' requested heret ) | ^ 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391 :R95u:n Wnote: oexpanded from macro 'IMPL_COLL_FUNC'r kElement <391F | n , RTu,n WRoerdkO,( )t.yrpuen,( wFeu)n;c # #| d ^e vredop1,: Nnote: Cin instantiation of member function 'RunWork, 1, 2>::run' requested hereC L_AL G6O | _I#M#PaLl_gCoO,L LN_CFCULN_CP(RROeTdOu_c#e#,p rRoItNoG>,( )S.IrMuPnL(E&,n cSculmS,h mienmt.3w2o_rtk)) ; | \^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :note: 562expanded from macro 'IMPL_COLL_FUNC': 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 391 | R562u | n W o r ktr,e aNdCICdLx_.AxL)G,O _g#r#oaulpg(og, NCCL_rPoRuOpT)O,_ # #| p ^~~~~~~~~~~~~~~~~r oto>/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:)562.:r60u:n (note: &field 'group' will be initialized after field 'stepSize'n cclShm e562m | . w o r kt)i;d (\t i d| ) ^, nthread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:(562n:t15h:r enote: afield 'nthreads' will be initialized after field 'tidInBlock'd s), tid I562n | B l o c kt(tihdr(etaiddI)d,x .nxt)h,r egardosu(pn(tghrroeuapd)s,) , | t ^~~~~~~~~~~i dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h::56234::157:: warning: note: initializer order does not match the declaration order [-Wreorder-ctor]in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | 562 | p r i m st(itdi(dt,i dn)t,h rnetahdrse,a d&sr(inntgh-r>epardesv),, &triidnIgn-B>lnoecxkt(,t harregasd-I>dsxe.nxd)b,u fgfr,o uapr(ggsr-o>urpe)c,v b u| f ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~f , | a tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r gs->re d563O | p A r g ,s t0e,p Sairzges(-n>cccolnSnhImnedme.xc,o mamr.gbsu-f>fcSoinzneIsn[dNeCxC)L;_ P R| O ^T O_SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.hP:L80E:]5/:N Cnote: Cin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested hereL _ST E80P | S / s i zreuonfR(iTn)g)< T{, R| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d O p| , group(group Proto>(args); | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h ^: 34:7: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: 202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 34 | 202 | p r i m s (RtuindW,o rnktEhlreemaednst,< F&nr,i nTg,- >RperdeOvp,, &Arlignog,- >Pnreoxtto,> (a)r.grsu-n>(sween)d;b u f| f ^, args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cppr:e7c:v1b:u fnote: fin instantiation of member function 'RunWork, 1, 2>::run' requested here, arg s7- | >IrMePdLO_pCAOrLgL,_ F0U,N Ca(rRgesd-u>cceo,n nRIInNdGe,x ,S IaMrPgLsE-,> cPornondI,n dueixn)t;3 2 _| t ^) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:: 391note: :in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here95 : note: expanded from macro 'IMPL_COLL_FUNC'80 | run R391i | n g #(#afrugnsc),; t y| p ^e , Func#/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h#:d202e:v53r:e dnote: oin instantiation of member function 'RunWorkElement, 1, 2>::run' requested herep 202, | N C C L _ A L GROu_n#W#oarlkgEol,e mNeCnCtL<_FPnR,O TTO,_ #R#epdrOopt,o >A(l)g.or,u nP(r&ontcoc>l(S)h.mreumn.(wwoer)k;) ; | \ ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h6::5621::15 :note: in instantiation of member function 'RunWork, 1, 2>::run' requested herenote: field 'nthreads' will be initialized after field 'tidInBlock' 6 | 562I | M P L _ CtOiLdL(_tFiUdN)C,( Rnetdhurceea,d sR(InNtGh,r eSaIdMsP)L,E ,t iPdrIondB,l oicnkt(3t2h_rte)a d I| d^x .x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:o391u:p95(:g rnote: oexpanded from macro 'IMPL_COLL_FUNC'u p), | ^~~~~~~~~~~~~~~~~ 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562R:u60n:W onote: rfield 'group' will be initialized after field 'stepSize'k t,i dNICnCBLl_oAcLkG(Ot_h#r#eaaldgIod,x .NxC)C,L _gPrRoOuTpO(_g#r#opurpo)t,o > (| ) ^~~~~~~~~~~. run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hM:P562L:_15C:O Lwarning: Linitializer order does not match the declaration order [-Wreorder-ctor]_ FUNC(Reduce, RING ,562 | S I M P LtEi,d (Ptriodd),, inntth6r4e_atd)s ( n| t^h reads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 391t:i95d:I nnote: Bexpanded from macro 'IMPL_COLL_FUNC'l ock(thre a391d | I d xR.uxn)W,o rgkrc,c lNSChCmLe_mA.LcGoOm_m#.#baulfgfoS,i zNeCsC[LN_CPCRLO_TPOR_O#T#Op_rSoItMoP>L(E)]./rNuCnC(L&_nScTcElPSSh/mseimz.ewoofr(kT));) \{ | | ^ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34: 7562: | note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here tid(tid) ,34 | n t h r e a dpsr(inmtsh(rteiadd,s )n,t htriedaIdnsB,l o&crki(ntgh-r>epardeIvd,x .&xr)i,n gg-r>onuepx(tg,r oaurpg)s,- > s| e ^~~~~~~~~~~~~~~~~n dbu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hf:f562,: 60a:r gnote: sfield 'group' will be initialized after field 'stepSize'- >recvb u562f | f , a rtgisd-(>triedd)O,p Anrtgh,r e0a,d sa(rngtsh-r>ecaodnsn)I,n dteixd,I naBrlgosc-k>(ctohnrneIanddIedxx).;x ) ,| ^g roup(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.hg:r80o:u5p:) ,note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here | ^~~~~~~~~~~ 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->coIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nnIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, S 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ IMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(thread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInoBclko(ctkh(rtehardeIaddxI.dxx).,x )g,r ogurpo(ugpr(ogurpo)u,p ) ,| ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::53562:: 15note: :in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here warning: initializer order does not match the declaration order [-Wreorder-ctor] 202 | RunWorkE l562e | m e n t s()),. rtuind(IwneB)l;o c k| ( ^t hreadId/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cppx:.9x:)1,: gnote: rin instantiation of member function 'RunWork, 1, 2>::run' requested hereo up(g r9o | uIpM)P,L _ C| O ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~L L _| F tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)U NC(Redu c563e | , R I NsGt,e pSSIiMzPeL(En,c cMlaSxh,m eumi.ncto6m4m_.tb)u f f| S^i zes[NC/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:L391_:P95R:O Tnote: Oexpanded from macro 'IMPL_COLL_FUNC'_ SIMPLE]/ N391C | C L _RSuTnEWPoSr/ks7,: Nnote: Cin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereC L_ALGO_## a34l | g o , N C CpLr_iPmRsO(TtOi_d#,# pnrtohtroe>a(d)s.,r u&nr(i&nngc-c>lpSrhemve,m .&wroirnkg)-;> n\e x t| , ^ args->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:e562n:d15b:u fnote: ffield 'nthreads' will be initialized after field 'tidInBlock', args- >562r | e cv b u ftfi,d (atrigds)-,> rnetdhOrpeAardgs,( n0t,h raeragdss-)>,c otnindIInndBelxo,c ka(rtghsr-e>acdoIndnxI.nxd)e,x )g;r o u| p ^( group)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h,: 80 :| 5 ^~~~~~~~~~~~~~~~~: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :562:60 :80 | note: field 'group' will be initialized after field 'stepSize' runR i562n | g < T , tRiedd(Otpi,d )P,r onttoh>r(eaardgss()n;t h r| e ^a ds), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:i202d:I53n:B lnote: oin instantiation of member function 'RunWorkElement, 1, 2>::run' requested herec k(thr e202a | d I d x . x ) , RgurnoWuopr(kgErloeumpe)n,t < F| n ^~~~~~~~~~~, T, RedOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hPR:O562T:O15_:# #warning: pinitializer order does not match the declaration order [-Wreorder-ctor]r oto>().run(&nc c562l | S h m e mt.iwdo(rtki)d;) ,\ n t| h ^r eads(nt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hh:r562e:a15d:s )note: ,field 'nthreads' will be initialized after field 'tidInBlock' tidInB l562o | c k ( t htrieda(dtIiddx).,x )n,t hgrreoaudps((gnrtohurpe)a,d s )| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ t i| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)I nBlock (563t | h r e a dsItdexp.Sxi)z,e (gnrcoculpS(hgmreomu.pc)o,m m .| b ^~~~~~~~~~~~~~~~~u ffS/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hi:z562e:s60[:N Cnote: Cfield 'group' will be initialized after field 'stepSize'L _PROTO _562S | I M P L Et]i/dN(CtCiLd_)S,T EnPtSh/rseiazdeso(fn(tTh)r)e a{d s )| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ t i| d group(groupI nBlock(thre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.ha:d34I:d7x:. xnote: )in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here, group(gr o34u | p ) , | ^~~~~~~~~~~p rims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Block(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connInIn file included from d/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cppe:x1): ;In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h :| 10 ^: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::80562::515:: note: warning: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested hereinitializer order does not match the declaration order [-Wreorder-ctor] 80 | runRin g562< | T , R etdiOdp(,t iPdr)o,t on>t(harregasd)s;( n t| h ^r eads)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h,: 202t:i53d:I nnote: Bin instantiation of member function 'RunWorkElement, 1, 2>::run' requested herel ock(t h202r | e a d I d x . x )R,u ngWroorukpE(lgermoeunpt)<,F n ,| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~T , | R tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)e dOp, Al g563o | , P r osttoe>p(S)i.zreu(nn(cwcel)S;h m e| m ^. comm.b/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cppu:f5f:S1i:z enote: sin instantiation of member function 'RunWork, 1, 2>::run' requested here[ NCCL_ P5R | OITMOP_LS_ICMOPLLLE_]F/UNNCCC(LR_eSdTuEcPeS,/ sRiIzNeGo,f (STI)M)P L{E , | P ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e M| u group(groupl Sum, uint8_t) | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h^: 34:7: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here: 391:95: note: expanded from macro 'IMPL_COLL_FUNC' 34 | 391 | p r iRmusn(Wtoirdk,< nnctchlrFeuandcs#,# f&urnicn,g -t>yppree,v ,F u&nrci#n#gd-e>vnreexdto,p >,s eNnCdCbLu_fAfL,G Oa_r#g#sa-l>groe,c vNbCuCfLf_,P RaOrTgOs_-#>#rperdoOtpoA>r(g),. r0u,n (a&rngcsc-l>SchomnenmI.nwdoerxk,) ;a r\g s -| > ^c onnIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:e562x:)15;: note: | field 'nthreads' will be initialized after field 'tidInBlock' ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h :56280 | : 5 : note: tin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested herei d(ti d80) | , n t hrruenaRdisn(gnl(oacrkg(st)h;r e a| d ^I dx.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :g202r:o53u:p (note: gin instantiation of member function 'RunWorkElement, 1, 2>::run' requested herer oup), 202 | | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :R60u:n Wnote: ofield 'group' will be initialized after field 'stepSize'r kEleme n562t | < F n , tTi,d (RteiddO)p,, nAtlhgroe,a dPsr(onttoh>r(e)a.drsu)n,( wtei)d;I n B| l ^o ck(th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cppr:e4a:d1I:d xnote: .in instantiation of member function 'RunWork, 1, 2>::run' requested herex ), gr o4u | pI(MgPrLo_uCpO)L,L _ F| U ^~~~~~~~~~~N C(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.ht:h34r:e7a:d Inote: din instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested herex .x), group(grou p34) | , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ p| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)i ms(tid ,563 | n t h r esatdesp,S i&zrei(nngc-c>lpSrhemve,m .&croimnmg.-b>unfefxSti,z easr[gNsC-C>Ls_ePnRdObTuOf_fS,I MaPrLgEs]-/>NrCeCcLv_bSuTfEfP,S /asrigzse-o>fr(eTd)O)p A{r g ,| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~0 , | a group(groupr gs->connIndex, ar/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.hg:s34-:>7c:o nnote: nin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested hereI ndex); | ^34 | prims/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h(:t80i:d5,: nnote: tin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested hereh read s80, | & r i nrgu-n>Rpirnegv<,T ,& rRiendgO-p>,n ePxrto,t oa>r(gasr-g>ss)e;n d b| u ^f f, args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h>:r202e:c53v:b unote: fin instantiation of member function 'RunWorkElement, 1, 2>::run' requested heref , args -202> | r e d O p A r g ,R u0n,W oarrkgEsl-e>mceonntn,c oAnlngIon,d ePxr)o;t o >| ( ^) .run(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.hw:e80):;5 : | note: ^in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp : 11 : 1r:u nnote: Rin instantiation of member function 'RunWork, 1, 2>::run' requested herei ngN(Ca(rRgesd)u;c e ,| ^R ING, SIM/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hP:L202E:,53 :P rnote: ein instantiation of member function 'RunWorkElement, 1, 2>::run' requested hereM ulSu m202, | f l o a t ) R| u^n WorkEle/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hm:e391n:t95<:F note: nexpanded from macro 'IMPL_COLL_FUNC', T, RedO p391, | A lRguon,W oPrrkoc(l)F.urnucn#(#wfeu)n;c , | t ^y pe, Func/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp#:#13d:e1v:r enote: din instantiation of member function 'RunWork, 1, 2>::run' requested hereo pI,M PNLC_CCLO_LALL_GFOU_N#C#(aRlegdou,c eN,C CRLI_NPGR,O TSOI_M#P#LpEr,o tPor>e(M)u.lrSuunm(,& nrccccllS_hbmfelmo.awto1r6k)) ; | \^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :expanded from macro 'IMPL_COLL_FUNC'562 :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 391 | Ru n562W | o r k < ntcicdl(Ftuindc)#,# fnutnhcr,e atdysp(en,t hFruenacd#s#)d,e vtrieddIonpBt,h rNeCaCdLI_dAxL.GxO)_,# #garloguop,( gNrCoCuLp_)P,R O T| O ^~~~~~~~~~~~~~~~~_ ##p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:o562t:o60>:( )note: .field 'group' will be initialized after field 'stepSize'r un(&ncc l562S | h m e m .twiodr(kt)i;d )\, n| t ^h reads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h(:n562t:h15r:e anote: dfield 'nthreads' will be initialized after field 'tidInBlock's ), tid I562n | B l o c kt(itdh(rteiadd)I,d xn.txh)r,e agdrso(unpt(hgrreoaudps)),, t| i ^~~~~~~~~~~d InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h, :N562C:C15L:_ Pwarning: Rinitializer order does not match the declaration order [-Wreorder-ctor]O TO_##proto>(). r562u | n ( & n ctcildS(htmiedm).,w onrtkh)r;e a\d s (| n ^t hread/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:)562,: 15t:i dnote: Ifield 'nthreads' will be initialized after field 'tidInBlock'n Block( t562h | r e a d Itdixd.(xt)i,d )g,r onutph(rgeraodusp()n,t h r| e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~a d s| ) tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T), tidInB l563o | c k ( t hsrteeapdSIidzxe.(xn)c,c lgSrhomuepm(.gcroomump.)b,u f f| S ^~~~~~~~~~~~~~~~~i zes/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h[:N562C:C60L: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx900. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 80 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(Reduce, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h_:t*514 :p9t:r warning: =variable 'offset' set but not used [-Wunused-but-set-variable] recvPt r514( | 0 ) + l li1n2t8 Ooffffsseett; = | t ^~~i d; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wiIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ reOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx90a. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx908. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx940. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h :153514 | : 9 : warning: uvariable 'offset' set but not used [-Wunused-but-set-variable]i nt32_t d a514t | a 1 , filnta go1f,f sdeatt a=2 ,t ifdl;a g 2| ; ^ | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx1030. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ :271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cppwarp(t:i1d: /WIn file included from A/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hR:P10_: SIn file included from I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hZ:E169): , /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h| : ~~~~~~~~~~~~~~~~~~509 : 29| : warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBloc k507( | t h r e atdiIdd(xt.ixd/)W,A RnPt_hSrIeZaEd)s,( n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d warp(tid/WARP_SIZEs ), wi d509( | t i d % WfAlRaPg_TShIrZeEa)d,( (wtairdp%(4t)i=d=/3W)A,R Pg_rSoIuZpE()g,r o u| p ~~~~~~~~~~~~~~~~~~) , | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)| ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 508 | 510w | a r p I nsBtleopcSki(zteh(rnecacdlISdhxm.exm/.WcAoRmPm_.SbIuZfEf)S,i z e| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~[ N C| C warp(tid/WARP_SIZEL _PROT O509_ | L L 1 2 8f]l/aNgCTChLr_eSaTdE(P(St/isdi%z4e)o=f=(3u)i,n tg6r4o_utp)()g r{o u p| ) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~, | | group(group ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h :s33t:e7p:S inote: zin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested heree (ncclShme m33. | c o m m . b upfrfiSmisz(etsi[dN,C CnLt_hPrReOaTdOs_,L L&1r2i8n]g/-N>CpCrLe_vS,T E&PrSi/nsgi-z>enoefx(tu,i natr6g4s_-t>)s)e n{d b u| f ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~f , | a group(groupr gs->recvbuff, args->redOp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hA:r33g:,7 :0 ,note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested herea rgs->connI n33d | e x , a r gpsr-i>mcso(ntniIdn,d enxt)h;r e a| d ^s , &ri/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hn:g92-:>5p:r enote: vin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here, &ri n92g | - > n e xrtu,n Rairnggs<-T>,s eRneddbOupf,f ,P raortgosL-L>1r2e8c>v(baurfgfs,) ;a r g| s ^- >redOpA/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:g202,: 530:, note: ain instantiation of member function 'RunWorkElement, 1, 1>::run' requested herer gs->c o202n | n I n d e x , aRrugnsW-o>rckoEnlneImnednetx<)F;n , | T ^, RedO/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hp:,92 :A5l:g onote: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here Prot o92 | > ( ) . rruunn(Rwien)g;< T ,| ^R edOp, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cppP:r13o:t1o:L Lnote: 1in instantiation of member function 'RunWork, 1, 1>::run' requested here2 8>(a r13g | sI)M;P L _| C ^O LL_FUNC(R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:d202u:c53e: Snote: cin instantiation of member function 'RunWorkElement, 1, 1>::run' requested herea tter, 202R | I N G , L L 1 2R8u,n WPorrekMEulleSmuemn,t () .391r | u n (Rwuen)W;o r k| < ^n cclFun/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cppc:#8#:f1u:n cnote: ,in instantiation of member function 'RunWork, 1, 1>::run' requested here type, 8F | uInMcP#L#_dCeOvLrLe_dFoUpNu,c eNSCcCaLt_tAeLrG,O _R#I#NaGl,g oL,L 1N2C8C,L _PPrReOMTuOl_S#u#mp,r oution>t(3)2._rtu)n ( &| n^c clShme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hm:.391w:o95r:k )note: ;expanded from macro 'IMPL_COLL_FUNC' \ | ^ 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:92:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 92 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | IMPL_COLL_FUNC(ReduceScatter, RING, LL128, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ 7 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1102. 7 warnings generated when compiling for gfx900. 7 warnings generated when compiling for gfx908. 7 warnings generated when compiling for gfx940. 7 warnings generated when compiling for gfx1101. 7 warnings generated when compiling for gfx906. 7 warnings generated when compiling for gfx803. 7 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 7 warnings generated when compiling for host. 7 warnings generated when compiling for gfx942. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx90a. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:212:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 212 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:224:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 224 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:212:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 212 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:224:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 224 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1030. 9 warnings generated when compiling for gfx1102. 9 warnings generated when compiling for gfx906. 9 warnings generated when compiling for gfx900. 9 warnings generated when compiling for gfx908. 9 warnings generated when compiling for gfx940. 9 warnings generated when compiling for gfx1101. 9 warnings generated when compiling for gfx90a. 9 warnings generated when compiling for gfx941. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx803. 9 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(SendRecv, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ TEPS>, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPSIn file included from //usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpps:i1z: e/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ho:f154(:u10i:n twarning: 6variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]4 _t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group154 | case /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h3::217 : 57| : ^ note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primiti/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cppv:e5s:<9T:, note: Rin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested heree dOp, F a5n | A s y m m e t r iMcSI,M P1L,_ KPErRoNtEoL,_ E0N>T RpYr_iFmUsN C _| D ^E VRED/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cppO:P5_:T9Y:P Enote: (in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested hereS um, u i5n | t 8 _ t , f a lMsSeC)C;L _ I| M ^P L_KER/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hN:E399L:_3E:N Tnote: Rexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'Y _FUNC_ D399E | V R EmDsOcPc_lTRYuPnEI(nStuemr,p rueitnetr8<_tty,p ef,a lFsuen)c;# # d| e ^v red/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ho:p402<:t3y:p enote: >expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE', Proto L402L | , fmuslclcOlpRsu>n(Icnotmemr,p reter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: :variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]154 :10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3154: | | ^ case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:: 5note: :in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here9 : note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | 5 | M S C C LM_SICMCPLL__IKMEPRLN_EKLE_RENNETLR_YE_NFTURNYC__FDUENVCR_EDDEOVPR_ETDYOPPE_(TSYuPmE,( Suuimn,t 8u_itn,t 8f_atl,s ef)a;l s e| ) ^; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::399402::33:: note: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399402 | | mmssccccllRRuunnIInntteerrpprreetteerr<>,, PPrroottooLLLL,1 2f8u,l lfOuplsl>O(pcso>m(mc,o maml,g oa,l gwoo,r kw)o;r k\) ; | \ ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::165165::3333:: note: note: uninitialized use occurs hereuninitialized use occurs here 165 | 165 | c ocpoypTyoTSohSmhemme8m(8t(itdi%dW%AWRAPR_PS_ISZIEZ,E ,d sdts,t ,s rscr,c ,b ybtyetse)s;) ; | ^~~| ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::5162:: 5warning: :variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | 162 | d e fdaeuflatu:l t :| ^~~~~~~ | ^~~~~~~/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :165/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::33165:: 33note: :uninitialized use occurs here note: uninitialized use occurs here 165 | 165 | c o pcyoTpoySThomSehmm8e(mt8i(dt%iWdA%RWPA_RSPI_ZSEI,Z Ed,s td,s ts,r cs,r cb,y tbeyst)e;s ) ;| ^~~ | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :134:14 :134 | note: initialize the variable 'dst' to silence this warning vo i134d | * d s tv,o i*ds r*cd;s t , *sr| ^ | = nullptr c; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ d(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ c##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_ST/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ EPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx941. 13 warnings generated when compiling for gfx908. 13 warnings generated when compiling for gfx940. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx90a. 13 warnings generated when compiling for gfx803. 13 warnings generated when compiling for gfx1030. 13 warnings generated when compiling for gfx906. 13 warnings generated when compiling for gfx1100. 13 warnings generated when compiling for gfx1101. 13 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 13 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, SumPostDiv, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 13 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ devredop, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx803. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Sum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid) ,562 | n t h r etaidds((tnitdh)r,e andtsh)r,e atdisd(InntBhlroecakd(st)h,r etaiddIIdnxB.lxo)c,k (gtrhoruepa(dgIrdoxu.px)),, g| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~o u p| ( tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)g roup), 563 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | s tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)t epSize (563n | c c l S hsmteemp.Sciozmem(.nbcucflfSShimzeems.[cNoCmCmL._bPuRfOfTSOi_zSeIsM[PNLCEC]L/_NPCRCOLT_OS_TSEIPMSP/LsEi]z/eNoCfC(LT_)S)T E{P S /| s ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i z e| o group(groupf (T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h::3333::77:: note: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested herein instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 3333 | | pprriimmss((ttiidd,, nntthhrreeaaddss,, &&rriinngg-->>pprreevv,, &&rriinngg-->>nneexxtt,, aarrggss-->>sseennddbbuuffff,, aarrggss-->>rreeccvvbbuuffff,, aarrggss-->>rreeddOOppAArrgg,, 00,, aarrggss-->>ccoonnnnIInnddeexx,, aarrggss-->>ccoonnnnIInnddeexx));; | | ^ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h::7878::55:: note: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested herein instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 7878 | | rruunnRRiinngg<>((aarrggss));; | | ^ ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h202::20253::53 : note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here202 | 202 | R u n W o r kREulneWmoernktE (P)r.ortuon>((w)e.)r;u n (| w ^e ); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cppin instantiation of member function 'RunWork, 1, 2>::run' requested here: 5:1: note: 5in instantiation of member function 'RunWork, 1, 2>::run' requested here | IMPL _5C | OILMLP_LF_UCNOCL(LR_eFdUuNcCe(SRceadtutceerS,c aRtItNeGr,, SRIIMNPGL,E ,S IPMrPoLdE,, uPirnotd8,_ tu)i n t| 8^_ t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h95::391 :note: 95expanded from macro 'IMPL_COLL_FUNC': note: expanded from macro 'IMPL_COLL_FUNC' 391 | 391R | u n WRournkWy,p eN>C,C LN_CACLLG_OA_L#G#Oa_l#g#oa,l gNoC,C LN_CPCRLO_TPOR_O#T#Op_r#o#tpor>o(t)o.>r(u)n.(r&unnc(c&lnSchcmleSmh.mweomr.kw)o;r k\) ; | \ ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::1515:: note: note: field 'nthreads' will be initialized after field 'tidInBlock'field 'nthreads' will be initialized after field 'tidInBlock' 562562 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::562562::6060:: note: note: field 'group' will be initialized after field 'stepSize'field 'group' will be initialized after field 'stepSize' 562562 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h : 562 :R15u:n Wwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]r kElemente(a)d.sr(unnt(hwree)a;d s )| , ^ tidInBl/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cppo:c7k:(1t:h rnote: ein instantiation of member function 'RunWork, 1, 2>::run' requested herea dIdx .7x | )I,M PgLr_oCuOpL(Lg_rFoUuNpC)(,R e d| u ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~c e S| c tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)a tter, R563I | N G , SsItMePpLSEi,z eP(rnocdc,l Suhimnetm3.2c_otm)m . b| u^f fSizes[N/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hC:C391L:_95P:R Onote: Texpanded from macro 'IMPL_COLL_FUNC'O _SIMPLE] /391N | C C LR_uSnTWEoPrSk/, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested herep e>, NCCL _ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nth33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(Redu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ MPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Prod, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, w/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ork); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hZ:E154,: 10d:s twarning: ,variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] src, byte s154) | ; | ^~~c ase 3:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h : 162| : ^5 : warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp :d5e:f9a:u lnote: tin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h5: | 165 : 33 : note: uninitialized use occurs here MSCC L165_ | I M P L _cKoEpRyNTEoLS_hEmNeTmR8Y(_tFiUdN%CW_ADREPV_RSEIDZOEP,_ TdYsPtE,( Ssurmc,, ibnytt3e2s_)t;, f| a ^~~l se); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::134162::145:: note: warning: initialize the variable 'dst' to silence this warningvariable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162134 | | dveofiadu l*td:s t ,| ^~~~~~~* sr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hc:;165 : 33| : ^ note: uninitialized use occurs here| = nullptr 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from 271 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp : 1u: inIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h6:410_: tIn file included from */usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h :p169t: r =/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h :r271e:c19v:P twarning: runused variable 'ptr' [-Wunused-variable]( 0)+ll128Offset; | ^~~ 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hi:n386t: 9w:i rwarning: evariable 'wireOffset' set but not used [-Wunused-but-set-variable]O ffset = 386W | i r e W oirndtP ewriSrleiOcfef*sweatr p= +W i2r*ewWiodr;d P e| r ^S lice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLLIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hthreadI:d562x:.15x:) ,warning: initializer order does not match the declaration order [-Wreorder-ctor]g roup(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: 562field 'group' will be initialized after field 'stepSize' | t i562d | ( t i d )t,i dn(tthirde)a,d sn(tnhtrheraedasd(sn)t,h rteiaddIsn)B,l otcikd(ItnhBrleoacdkI(dtxh.rxe)a,d Igdrxo.uxp)(,g rgoruopu)p,( g r| o ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~u p )| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) | ^~~~~~~~~~~ 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h<:F562n:,15 :T ,warning: initializer order does not match the declaration order [-Wreorder-ctor]R edOp, Algo, Proto>( )562. | r u n ( wtei)d;( t i| d ^) , nthrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cppd:s9(:n1t:h rnote: ein instantiation of member function 'RunWork, 1, 2>::run' requested herea ds), 9t | iIdMIPnLB_lCoOcLkL(_tFhUrNeCa(dRIeddxu.cxe)S,c agtrtoeurp,( gRrIoNuGp,) ,S I M| P ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~L E ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)M ax, ui n563t | 6 4 _ t )s t e| p^S ize(n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hc:c391l:S95h:m enote: mexpanded from macro 'IMPL_COLL_FUNC'. comm.buf f391S | i z eRsu[nNWCoCrLk_ ,| group(groupN CCL_ALGO_##algo, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hN:C33:C7L:_ Pnote: Rin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested hereO TO_##prot o33> | ( ) . r upnr(i&mnsc(ctliSdh,m enmt.hwroerakd)s;, \& r i| n ^g ->pre/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hv:,562 :&15r:i nnote: gfield 'nthreads' will be initialized after field 'tidInBlock'- >next, 562 | a r g s -t>isde(ntdibdu)f,f ,n tahrrgesa-d>sr(enctvhbruefafd,s )a,r gtsi-d>IrneBdlOopcAkr(gt,h r0e,a daIrdgxs.-x>)c,o ngnrIonudpe(xg,r oaurpg)s,- > c| o ^~~~~~~~~~~~~~~~~n nIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hd:e562x:)60;: note: | field 'group' will be initialized after field 'stepSize' ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h562: | 78 : 5 : tnote: iin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested hered (t i78d | ) , n trhurneRaidnsg(B(laorcgks()t;h r e| a ^d Idx.x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h):,202 :g53r:o unote: pin instantiation of member function 'RunWorkElement, 1, 2>::run' requested here( group )202, | | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max ,562 | ha l f ) t i| d^( tid), nthreads(nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hr:e391a:d95s:) ,note: expanded from macro 'IMPL_COLL_FUNC't idInBlock(thre a391d | I d xR.uxn)W,o rgkrn,c cNlCSChLm_eAmL.GcOo_m#m#.ablugfof,S iNzCeCsL[_NPCRCOLT_OP_R#O#TpOr_oStIoM>P(L)E.]r/uNnC(C&Ln_cScTlESPhSm/esmi.zweoorfk()T;) )\ { | ^| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h | : 33 : 7 :t inote: din instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here( tid), nthr e33a | d s ( n t h rperaidmss)(,t itdi,d InntBhlroecakd(st,h r&eraidnIgd-x>.pxr)e,v ,g r&oruipn(gg-r>onuepx)t,, a| r ^~~~~~~~~~~~~~~~~g s->/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hs:e562n:d60b:u fnote: ffield 'group' will be initialized after field 'stepSize', args- >562r | e c v b utfifd,( tairdg)s,- >nrtehdrOepaAdrsg(,n t0h,r eaardgss)-,> ctoindnIInnBdleoxc,k (atrhgrse-a>dcIodnxn.Ixn)d,e xg)r;o u p| ( ^g roup),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h : 78| : ^~~~~~~~~~~5 : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceSc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ha:t562t:e15r:, warning: Rinitializer order does not match the declaration order [-Wreorder-ctor]I NG, SIMPLE, Ma x562, | r c c lt_ibdf(ltoiadt)1,6 )n t h| r^e ads(nthreads), tidInB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hl:o391c:k95(:t hnote: rexpanded from macro 'IMPL_COLL_FUNC'e adIdx.x), grou p391( | g r oRuupn)W,o r k| < ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n c c| l tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)F unc##f u563n | c , t ysptee,p SFiuznec(#n#cdcelvSrhemdeomp.b,u fNfCSCiLz_eAsL[GNOC_C#L#_aPlRgOoT,O _NSCICMLP_LPER]O/TNOC_C#L#_pSrToEtPoS>/(s)i.zreuonf((&Tn)c)c l{S h m| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~m . w| o group(groupr k); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h33: | 562 : 15 : note: field 'nthreads' will be initialized after field 'tidInBlock'p rims(tid ,562 | n t h r etaidds(,t i&dr)i,n gn-t>hprreeavd,s (&nrtihnrge-a>dnse)x,t ,t iadrIgnsB-l>oscekn(dtbhurfefa,d Iadrxg.sx-)>,r egcrvobuupf(fg,r oaurpg)s,- > r| e ^~~~~~~~~~~~~~~~~d OpA/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:g562,: 600:, note: afield 'group' will be initialized after field 'stepSize'r gs->co n562n | I n d e xt,i da(rtgisd-)>,c onntnhIrnedaedxs)(;n t h| r ^e ads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h :t78i:d5I:n Bnote: lin instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested hereo ck( t78h | r e a d Irduxn.Rxi)n,g ^~~~~~~~~~~( args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx1101. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1100. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMax<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Max, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h::110: : In file included from In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h::10167: : In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h::562167:: 15/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:: 562warning: :initializer order does not match the declaration order [-Wreorder-ctor]15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | 562t | i d ( t itdi)d,( tnitdh)r,e andtsh(rnetahdrse(andtsh)r,e atdisd)I,n BtliodcIkn(Btlhorceka(dtIhdrxe.axd)I,d xg.rxo)u,p (ggrroouupp()g,r o u| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~) , | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | 563s | t e p S isztee(pnSciczleS(hnmcecml.Schommemm..bcuofmfmS.ibzuefsf[SNiCzCeLs_[PNRCOCTLO__PSRIOMTPOL_ES]I/MNPCLCEL]_/SNTCECPLS_/SsTiEzPeSo/fs(iTz)e)o f{( T )| ) ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ { | group(group| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h :note: 33in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here: 7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | p r33i | m s ( t i d ,p rnitmhsr(etaidds,, n&trhirnega-d>sp,r e&vr,i n&gr-i>npgr-e>vn,e x&tr,i nagr-g>sn-e>xste,n dabrugfsf-,> saerngdsb-u>frfe,c vabrugfsf-,> raercgvsb-u>frfe,d OaprAgrsg-,> r0e,d OaprAgrsg-,> c0o,n naIrngds-e>xc,o nanrIgnsd-e>xc,o nanrIgnsd-e>xc)o;n n I| n ^d ex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h5::78 :note: 5in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | 78 | r u n R irnugnr(oatrog>s()a;r g s| ) ^; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:: 202note: :in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here53 : note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | 202 | R u n W oRruknEWloermkeEnlter(o)t.or>u(n)(.wreu)n;( w e| ) ^; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:: 4note: :in instantiation of member function 'RunWork, 1, 2>::run' requested here1 : note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMP L4_ | CIOMLPLL__FCUONLCL(_RFeUdNuCc(eReSdcuactetSecra,t tReIrN,G ,R ISNIGM,P LSEI,M PMLiEn,, Miinnt,8 _itn)t 8_ t| )^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h::95391:: 95note: :expanded from macro 'IMPL_COLL_FUNC' note: expanded from macro 'IMPL_COLL_FUNC' 391 | 391 | R u nRWuonrWkop,e >N,C CNLC_CALL_GAOL_G#O#_a#l#gaol,g oN,C CNLC_CPLR_OPTROO_T#O#_p#r#optroo>t(o)>.(r)u.nr(u&nn(c&cnlcSchlmSehmm.ewmo.rwko)r;k )\; \| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h::15562:: 15note: :field 'nthreads' will be initialized after field 'tidInBlock' note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | 562 | t i dt(itdi(dt)i,d )n,t hnrtehardesa(dnst(hnrtehardesa)d,s )t,i dtIindBIlnoBclko(cthreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_ST/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ EPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->con/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hN:C562C:L15_:A Lwarning: Ginitializer order does not match the declaration order [-Wreorder-ctor]O _##algo, NCCL_PR O562T | O _ # # ptriodt(ot>i(d)).,r unnt(h&rnecacdlsS(hnmtehmr.ewaodrsk)),; t\i d I| n ^B lock(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ht:h562r:e15a:d Inote: dfield 'nthreads' will be initialized after field 'tidInBlock'x .x), g r562o | u p ( g rtoiudp()t,i d )| , ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ n t| h tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)r eads(n t563h | r e a stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hm:.c562o:m15m:. bwarning: uinitializer order does not match the declaration order [-Wreorder-ctor]f fSizes[NCCL_PRO T562O | _ S I M PtLiEd](/tNiCdC)L,_ SnTtEhPrSe/asdisz(enotfh(rTe)a)d s{) , | t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i d I| n group(groupB lock(threadIdx.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hr:o33u:p7(:g rnote: oin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested hereu p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | 33 tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) | p r563i | m s ( t isdt,e pnStihzree(andcsc,l S&hrmienmg.-c>opmrme.vb,u f&frSiinzge-s>[nNeCxCtL,_ PaRrOgTsO-_>SsIeMnPdLbEu]f/fN,C CaLr_gSsT-E>PrSe/csvibzuefoff,( Ta)r)g s{- > r| e ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d O p| A group(groupr g, 0, args-/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h>:c33o:n7n:I nnote: din instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested heree x, args-> c33o | n n I n d e xp)r;i m s| ( ^t id, n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.ht:h78r:e5a:d snote: ,in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here &rin g78- | > p r e vr,u n&Rriinngg<-T>,n eRxetd,O pa,r gPsr-o>tsoe>n(dabrugfsf),; a r| g ^s ->recv/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hb:u202f:f53,: anote: rin instantiation of member function 'RunWorkElement, 1, 2>::run' requested hereg s->re d202O | p A r g , 0 , RaurngWso-r>kcEolnenmIenndteecdoOnpn,I nAdlegxo),; P r| o ^t o>()./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hr:u78n:(5w:e )note: ;in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here | ^ 78 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cppr:u12n:R1i:n gnote: , 1, 2>::run' requested hereT , Red O12p | ,I MPPrLo_tCoO>L(La_rFgUsN)C;( R e| d ^u ceScat/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:e202r:,53 :R Inote: Nin instantiation of member function 'RunWorkElement, 1, 2>::run' requested hereG , SIM P202L | E , M i n , dRouunbWloer)k E l| e^m entn(W)o.rrku, 1, 2>::run' requested herec ##dev r10e | dIoMpPL,_ FNUCNCCL(_RAeLdGuOc_e#S#caaltgtoe,r ,N CRCILN_GP,R OSTIOM_P#L#Ep,r oMtion>,( )h.arlufn)( & n| c^c lShme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hm:.391w:o95r:k )note: ;expanded from macro 'IMPL_COLL_FUNC' \ | ^ 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :R562u:n15W:o rnote: kfield 'nthreads' will be initialized after field 'tidInBlock'< ncclFu n562c | # # f u ntci,d (ttyipde),, Fnutnhcr#e#addesv(rnetdhorpe ,t iNdCICnLB_lAoLcGkO(_t#h#raelagdoI,d xN.CxC)L,_ PgRrOoTuOp_(#g#rporuopt)o,> ( )| . ^~~~~~~~~~~~~~~~~r un(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h&:n562c:c60l:S hnote: mfield 'group' will be initialized after field 'stepSize'e m.work )562; | \ | t ^i d(tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h):,562 :n15t:h rnote: efield 'nthreads' will be initialized after field 'tidInBlock'a ds(nth r562e | a d s ) ,t itdi(dtIindB)l,o cnkt(htrheraedasd(Indtxh.rxe)a,d sg)r,o utpi(dgIrnoBulpo)c,k ( t| h ^~~~~~~~~~~r eadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork,, nNtChCrLe_aAdLsG(On_t#h#raelagdos,) ,N CtCiLd_IPnRBOlToOc_k#(#tphrroetaod>I(d)x..rxu)n,( &gnrcoculpS(hgmreomu.pw)o,r k )| ; ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ \ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h563: | 562 : 15 : snote: tfield 'nthreads' will be initialized after field 'tidInBlock'e pSize( n562c | c l S h mteimd.(ctoimdm).,b unftfhSriezaedss[(NnCtChLr_ePaRdOsT)O,_ StIiMdPILnEB]l/oNcCkC(Lt_hSrTeEaPdSI/dsxi.zxe)o,f (gTr)o)u p{( g r| o ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u p )| , group(group | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hfield 'group' will be initialized after field 'stepSize': 33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here562 | tid( t33i | d ) , n t hprreiamdss((tnitdh,r enatdhsr)e,a dtsi,d I&nrBilnogc-k>(ptrherve,a d&Irdixn.gx-)>,n egxrto,u pa(rggrso-u>ps)e,n d b| u ^~~~~~~~~~~f f, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ T, RedOp, Algo, Proto>().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx941. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx940. 17 warnings generated when compiling for gfx1102. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMin<__half>, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, Min, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' E(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tidIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp : 1u: iIn file included from n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ht:3132: _In file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h :d168a: t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.ha:1153,: 14f:l awarning: gunused variable 'data1' [-Wunused-variable]1 , data2, flag2; | ^~~~~ 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##p/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hon:n562I:n15d:e xwarning: )initializer order does not match the declaration order [-Wreorder-ctor]; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 562 | 78 | t i d (rtuindR)i,n gn)(,a rtgisd)I;n B l| o ^c k(thr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.he:a202d:I53d:x .note: xin instantiation of member function 'RunWorkElement, 1, 2>::run' requested here) , gro u202p | ( g r o u p ) , R u| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~W o r| k tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)E lement <563F | n , T ,s tReepdSOipz,e (Anlcgcol,S hPmreomt.oc>o(m)m..rbuunf(fwSei)z;es [ N| CC ^L _PROTO_S/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cppI:M7P:L1E:] /note: Nin instantiation of member function 'RunWork, 1, 2>::run' requested hereC CL_S T7E | PISM/PsLi_zCeOoLfL(_TF)U)N C{( R e| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~u c e| S group(groupc atter, RING, SIMPL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hE:,33 :P7r:e Mnote: uin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested herel Sum, uint 3332 | _ t ) | ^p rims(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.ht:i391d:,95 :n tnote: hexpanded from macro 'IMPL_COLL_FUNC'r eads, & r391i | n g -R>upnrWeovr,k <&nrcicnlgF-u>nnce#x#tf,u nacr,g st-y>psee,n dFbuunfcf#,# daervgrse-d>orpef,, NaCrCgLs_-A>LrGeOd_O#p#Aarlgg,o ,0 ,N CaCrLg_sP-R>OcToOn_n#I#npdreoxt,o >a(r)g.sr-u>nc(o&nnncIcnldSehxm)e;m . w| o ^r k); \/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h : 78| : ^5 : note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562 :7815 | : note: field 'nthreads' will be initialized after field 'tidInBlock' runRin g562< | T , R etdiOdp(,t iPdr)o,t on>t(harregasd)s;( n t| h ^r eads),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :t202i:d53I:n Bnote: lin instantiation of member function 'RunWorkElement, 1, 2>::run' requested hereo ck(t h202r | e a d I d x . x )R,u ngWroorukpE(lgermoeunpt)<,F n ,| ^~~~~~~~~~~~~~~~~T , R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:d562O:p60,: Anote: lfield 'group' will be initialized after field 'stepSize'g o, Pr o562t | o > ( ) .triudn((twied));, n| t ^h reads/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp(:n6t:h1r:e anote: din instantiation of member function 'RunWork, 1, 2>::run' requested heres ), ti d6I | nIBMlPoLc_kC(OtLhLr_eFaUdNICd(xR.exd)u,c egSrcoautpt(egrr,o uRpI)N,G , | S ^~~~~~~~~~~I MPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here: 562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 33 | prims (562t | i d , nttihdr(etaidds),, &nrtihnrge-a>dpsr(envt,h r&eraidnsg)-,> nteixdtI,n Balrogcsk-(>tshernedabduIfdfx,. xa)r,g sg-r>oruepc(vgbruofufp,) ,a r g| s ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~- > r| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)d OpArg, 0563, | a r g ss-t>ecpoSninzIen(dnecxc,l Sahrmgesm-.>ccoomnmn.IbnudfefxS)i;z e s| [ ^N CCL_PR/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.hO:T78O:_5S:I Mnote: Pin instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested hereL E]/N C78C | L _ S T ErPuSn/Rsiinzge (args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7:/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h :note: 202in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here: 53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 33 | 202 | p r i m s ( t iRdu,n WnotrhkrEelaedmse,n t&,p rReevd,O p&,r iAnlgg-o>,n ePxrto,t oa>r(g)s.-r>usne(nwdeb)u;f f ,| ^a rgs->re/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cppc:v10b:u1f:f ,note: in instantiation of member function 'RunWork, 1, 2>::run' requested herea rgs-> r10e | dIOMpPALr_gC,O L0L,_ FaUrNgCs(-R>ecdouncneISncdaetxt,e ra,r gRsI-N>Gc,o nSnIIMnPdLeEx,) ;P r e| M ^u lSum/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h,: 78h:a5l:f )note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here | ^ 78 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h : 391 :r95u:n Rnote: iexpanded from macro 'IMPL_COLL_FUNC'n gr(ka, 1, 2>::run' requested hereu nc##d e202v | r e d o p < t y pReu>n,W oNrCkCELl_eAmLeGnOt_<#F#na,l gTo,, RNeCdCOLp_,P RAOlTgOo_,# #Pprroottoo>>(())..rruunn((w&en)c;c l S| h ^m em.wor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cppk:)12;: 1\: note: | in instantiation of member function 'RunWork, 1, 2>::run' requested here ^ 12/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h | :I562M:P15L:_ Cnote: Ofield 'nthreads' will be initialized after field 'tidInBlock'L L_FUNC (562R | e d u c etSicda(tttiedr),, RnItNhGr,e aSdIsM(PnLtEh,r ePardesM)u,l Stuimd,I ndBoluobclke()t h r| e^a dIdx./usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.hx:)391,: 95g:r onote: uexpanded from macro 'IMPL_COLL_FUNC'p (group), 391 | | ^~~~~~~~~~~~~~~~~ Run/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hW:o562r:k60<:n cnote: cfield 'group' will be initialized after field 'stepSize'l Func## f562u | n c , ttyipde(,t iFdu)n,c #n#tdherveraeddso(pnd,s )N,C CtLi_dAILnGBOl_o#c#ka(ltghor,e aNdCICdLx_.PxR)O,T Og_r#o#uppr(ogtroo>u(p)).,r u n| ( ^~~~~~~~~~~& ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx908. 17 warnings generated when compiling for gfx90a. 17 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1101. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:10: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint8_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint32_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, int64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, uint64_t) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, half) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, float) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, double) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/reduce_scatter.h:78:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 78 | runRing(args); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | IMPL_COLL_FUNC(ReduceScatter, RING, SIMPLE, PreMulSum, rccl_bfloat16) | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/common.h:391:95: note: expanded from macro 'IMPL_COLL_FUNC' 391 | RunWork, NCCL_ALGO_##algo, NCCL_PROTO_##proto>().run(&ncclShmem.work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. 17 warnings generated when compiling for gfx1030. 17 warnings generated when compiling for gfx803. 17 warnings generated when compiling for gfx906. 17 warnings generated when compiling for gfx900. 17 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, In file included from u/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cppi:n1t: 6In file included from 4/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h_:t13,: In file included from f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.ha:l169s: e/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h):;509 : 29| : ^ warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 507 | tid (405t | i d )m,s cnctlhRruenaIdnst(enrtphrreetaedrs<)t,y pwei,d (Ftuindc%#W#deAvRrPe_dSoIpZa,r pP(rtoitdo/SWiAmRpPl_eSP,_ SfIuZlEl)O,p s >| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c o m| m warp(tid/WARP_SIZE, algo ,509 | w o r k )f;l a\g T h| r ^e ad((/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ht:i165d:%334:) =note: =uninitialized use occurs here3 ), grou p165( | g r o u pc)o,p y T| o ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~S h m| e warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3m 8(tid%W A510R | P _ S I ZsEt,e pdSsitz,e (snrccc,l Sbhymteems.)c;o m m| . ^~~b uffSize/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hs:[162N:C5C:L _warning: Pvariable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized]R OTO _162L | L 1 2 8 ]d/eNfCaCuLl_tS:T E P| S ^~~~~~~/ si/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hz:e165o:f33(:u inote: nuninitialized use occurs heret 64_t) )165 | { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c o p| y group(groupT oShmem8(t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hi:d217%:W57A:R Pnote: _in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested hereS IZE, d217s | t , Psrricm,i tbiyvteess<)T;, R| e ^~~d Op, FanAsymmetric<1,1>, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h402: | 134 : 14m:s cnote: cinitialize the variable 'dst' to silence this warningl RunIn t134e | r p r e tveori
, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false)In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr ; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives:,154 :110,: Pwarning: rvariable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]o to, 0> prims 154 | | ^ cas/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cppe: 53::9 : | note: ^in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp_:I5M:P9L:_ Knote: Ein instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested hereR NEL_EN 5T | R Y _ F U N C _ DMESVCRCELD_OIPM_PTLY_PKE(ESRuNmE,L _fElNoTaRtY,_ FfUaNlCs_eD)E;V R E| D ^O P_TY/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hP:E405(:S3u:m ,note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'f loat, fal s405e | ) ; m s| c ^c lRunI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hn:t399e:r3p:r enote: texpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'e re,r P,S /PMrSoCtCoLL_LSL,I CfEuSlTlEOPpSs,> (McSoCmCmL,_ SaLlIgCoE,S TwEoPrS>k,) ;f u\l l O| p ^s >(comm, a/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hl:g165o:,33 :w onote: runinitialized use occurs herek ); \ | ^165 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hc:o562p:y15T:o Snote: hfield 'nthreads' will be initialized after field 'tidInBlock'm em8(ti d562% | W A R P _tSiIdZ(Et,i dd),s tn,t hsrreca,d sb(ynttehsr)e;a ds )| , ^~~ tidInB/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hl:o162c:k5(:t warning: hvariable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized]r ead I162d | x . x ) ,d egfraouulpt(:g r o| up ^~~~~~~) , /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :| 165 ^~~~~~~~~~~~~~~~~: 33: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hnote: :uninitialized use occurs here562 :60: note: 165field 'group' will be initialized after field 'stepSize' | co p562y | T o S h mteimd8((ttiidd)%,W AnRtPh_rSeIaZdEs,( ndtshtr,e asdrsc),, btyitdeIsn)B;l o c| k ^~~( threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ; \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdIn file included from x.x), /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cppg:r1o: up/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h(:g154r:o10u:p )warning: ,variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h :154562 | : 60 : note: cfield 'group' will be initialized after field 'stepSize'a se 3: 562| | ^ tid(tid), nthreads(nthr/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cppe:a5d:s9):, note: tin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested herei dInBlo c5k | ( t h r e a d I dMxS.CxC)L,_ IgMrPoLu_pK(EgRrNoEuLp_)E,N T R| Y ^~~~~~~~~~~_ FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.hla:g5142:;9 : | warning: ^~~~~variable 'offset' set but not used [-Wunused-but-set-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 514 | 153 | i n t oufifnste3t2 _=t tdiadt;a 1 ,| ^f lag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | In file included from i/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cppn:t1 : wIn file included from i/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hr:e13O: fIn file included from f/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hs:e168t: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h=: 153W:i14r:e Wwarning: ounused variable 'data1' [-Wunused-variable]r dPerSlice*warp 153+ | 2 * w iudi;n t 3| 2 ^_ t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offsIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp271: | 1 : In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h : 13 : In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hu:i169n: t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h6:4271_:t19*: pwarning: tunused variable 'ptr' [-Wunused-variable]r = recvPtr(0) +271l | l 1 2 8 O f f s euti;n t 6| 4 ^~~_ t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ et = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | msc/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ st, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp::4021:: 3/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:: 154note: :expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'10 : warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 402 | m s154c | c l R u ncIanstee r3p:r e t| e ^r , ProtoLL, false>' requested herey pe>, P r5o | t o L L 1 2 8 , MfSuClClLO_pIsM>P(Lc_oKmEmR,N EaLl_gEoN,T RwYo_rFkU); \ | ^ NC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hbytes):; 154 :| 10 ^~~: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h405: | 134 : 14m:s cnote: cinitialize the variable 'dst' to silence this warningl RunInterp r134e | t e r < tvyopied, *Fdusntc,# #*dservcr;e d o| p ^< t y| p = nullptre >, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/:W134A:R14P:_ Snote: Iinitialize the variable 'dst' to silence this warningZ E), 134| | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZEv oid *509d | s t , *fslracg;T h r| e ^a d (| ( = nullptrt id%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | msIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:c1c: lIn file included from R/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hu:n13I: nIn file included from t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.he:r169p: re/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.ht:e509r:<29t:y pwarning: efield 'group' will be initialized after field 'stepSize' [-Wreorder-ctor], Func##devred o507p | < t y p et>i,d (Ptriodt)o,S inmtphlreeE,) ,f u l| l ~~~~~~~~~~~~~~~~~~O p s| > stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)( comm, 508a | l g o , wwaorrpkI)n;B l\o c k| ( ^t hrea/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hd:I165d:x33.:x /note: Wuninitialized use occurs hereA RP_SIZ E165) | , | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~c o p| y warp(tid/WARP_SIZET oShme m5098 | ( t i d %fWlAaRgPT_hSrIeZaEd,( (dtsti,d %s4rc),= =b3y)t,e sg)r; o u| p ^~~( group)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h,: 162 :| 5 ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~: warning: | variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 162 | 510 | d e f a usltte:p S i| z ^~~~~~~e (n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hc:c165l:S33h:m enote: muninitialized use occurs here .comm .165b | u f f S iczoepsy[TNoCSChLm_ePmR8O(TtOi_dL%LW1A2R8P_]S/INZCEC,L _dSsTtE,P Ss/rsci,z eboyft(eusi)n;t 6 4| _ ^~~t )) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::402134::314:: note: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'initialize the variable 'dst' to silence this warning 134402 | | m svcocildR u*ndIsntt,e r*psrrect;e r <| t ^y p e| , = nullptr Func##devredop, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmeIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr m8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | PrimitivesIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_T, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ YPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSiz/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.he:(154n:c10c:l Swarning: hvariable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]m em.comm.b u154f | f S i z ecsa[sNeC C3L:_ P R| O ^T O_LL128]/NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cppS:T5E:P9S:/ snote: iin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested herez eof(ui n5t | 6 4 _ t ) ) { M S| C ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C L _| I group(groupM PL_KERNEL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hE:N217T:R57Y:_ Fnote: Uin instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested hereN C_DEV R217E | D O PP_rTiYmPiEt(iSvuems,< Td,o uRbeldeO,p ,f aFlasneA)s;y m m| e ^t ric<1,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h1:>402,: 31:, note: Pexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'r oto, 0> 402p | r i mmss c c| l ^R unIn/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cppt:e5r:p9r:e tnote: ein instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested herer K,E RPNrEoLt_oELNLT1R2Y8_,F UfNuCl_lDOEpVsR>E(DcOoPm_mT,Y PaEl(gSou,m ,w odroku)b;l e\, f| a ^l se)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h;: 165 :| 33 ^: note: uninitialized use occurs here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: 165note: | expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' cop y402T | o S hmmsecmc8l(RtuindI%nWtAeRrPp_rSeItZeEr,< tdyspte,, sFrucn,c #b#ydteevsr)e;d o p| < ^~~t ype>, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hP:r162o:t5o:L Lwarning: 1variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized]2 8, f162u | l l O p sd>e(fcaoumlmt,: a l| g ^~~~~~~o , /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hw:o165r:k33):; note: \uninitialized use occurs here | ^ 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, Prot/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ oSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx941. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 15 warnings generated when compiling for gfx90a. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSi/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr ze(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(grou/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ p), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), g/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h| : ^514 :9: warning: variable 'offset' set but not used [-Wunused-but-set-variable]/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :165:33: note: uninitialized use occurs here 514 | i165n | t o f fcsoepty T=o Sthimde;m 8 (| t ^i d%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ :386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, byte/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ s); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlockIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | cop(yTtohSrhemaedmI8d(xt.ixd)%,W AgRrPo_uSpI(ZgEr,o udps)t,, s| r ^~~~~~~~~~~c , bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t datIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ a1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] ); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 15 warnings generated when compiling for gfx1100. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1101. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr 15 warnings generated when compiling for gfx940. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 15 warnings generated when compiling for gfx906. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives , 1 ,c aPsreo t3o:, 0| > ^ prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp::55::99:: note: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested herein instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | 5 | M SMCSCCLC_LI_MIPMLP_LK_EKRENRENLE_LE_NETNRTYR_YF_UFNUCN_CD_EDVERVERDEODPO_PT_YTPYEP(EM(aMxa,x ,i nitn3t23_2t_,t ,f aflasles)e;) ; | ^| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::3399:: 3note: :expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405399 | | mmssccccllRRuunnIInntteerrpprreetteerr<>,, PPrroottooSLiLm,p lfeu_(CcHoUmNmK,S TaElPgSo/,M SwCoCrLk_)S;L I\C E S| T ^E PS, /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hM:S165C:C33L:_ Snote: Luninitialized use occurs hereI CESTEPS >165, | f u l lcOoppsy>T(ocSohmmme,m 8a(ltgiod,% WwAoRrPk_)S;I Z\E , | d ^s t, s/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hr:c562,: 15b:y tnote: efield 'nthreads' will be initialized after field 'tidInBlock's ); | ^~~ 562 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ht:i162d:(5t:i dwarning: )variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized], nt h162r | e a d s (dnetfharuelatd:s ) ,| ^~~~~~~t id/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hI:n165B:l33o:c knote: (uninitialized use occurs heret hread I165d | x . x ) ,c ogpryoTuopS(hgmreomu8p()t,i d %| W ^~~~~~~~~~~~~~~~~A RP_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hS:I562Z:E60,: dnote: sfield 'group' will be initialized after field 'stepSize't , src, 562b | y t e s )t;i d (| t ^~~i d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter13,: In file included from P/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.hr:o167t: o/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hL:L562,: 15f:u lwarning: linitializer order does not match the declaration order [-Wreorder-ctor]O ps>(comm, a l562g | o , w otrikd)(;t i\d ) ,| ^n th/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hr:e165a:d33s:( nnote: tuninitialized use occurs hereh reads )165, | t i d IcnoBplyoTcokS(htmherme8a(dtIiddx%.Wx), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr PE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSliceIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ *warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx906. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] In file included from 153/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp | : 1 : In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hu:i13n: tIn file included from 3/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h2:_169t: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hd:a271t:a191:, warning: funused variable 'ptr' [-Wunused-variable]l ag1, data2, f271l | a g 2 ; | ^~~~~ ui/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.hn:t1536:435_:t *warning: unused variable 'flag2' [-Wunused-variable]p tr = 153r | e c v P turi(n0t)3+2l_lt1 2d8aOtfaf1s,e tf;l a g| 1 ^~~, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ , data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | defauIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr lt: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ (Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 15 warnings generated when compiling for host. /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInter/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ preter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hr:e154a:d10s:( nwarning: tvariable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]h reads), t i154d | I n B l occaks(et h3r:e a d| I ^d x.x), group(/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cppg:r5o:u9p:) ,note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)5 | 563 | M S C CsLt_eIpMSPiLz_eK(EnRcNcElLS_hEmNeTmR.Yc_oFmUmN.Cb_uDfEfVSRiEzDeOsP[_NTCYCPLE_(PMRaOxT,O _iSnItM8P_LtE,] /fNaClCsLe_)S;T E P| S ^/ sizeo/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hf:(402T:)3): {note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 402 | mscclRunI/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hn:t217e:r57p:r enote: tin instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested heree rp,, PFraontAosLyLm1m2e8t,r ifcus,> (1c,o mPmr,o taol,g o0,> wporrikm)s; \| ^ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp::1655::339:: note: note: uninitialized use occurs herein instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 1655 | | c o p y TMoSSChCmLe_mI8M(PtLi_dK%EWRANREPL__SEINZTER,Y _dFsUtN,C _sDrEcV,R EbDyOtPe_sT)Y;P E (| M ^~~a x, i/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hn:t1628:_5t:, warning: fvariable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized]a lse )162; | | ^ defaul/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ht::405 : 3| : ^~~~~~~ note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :165:33: note: uninitialized use occurs here 405 | 165m | s c c l RcuonpIynTtoeSrhpmreemt8e(rtt,e sP)r;o t o| S ^~~i mple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :g134r:o14u:p (note: ginitialize the variable 'dst' to silence this warningr oup), 134 | | ^~~~~~~~~~~~~~~~~ v/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.ho:i562d: 60*:d snote: tfield 'group' will be initialized after field 'stepSize', *src ;562 | | ^ | t = nullptri d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx803. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_half.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_half.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid)/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMax<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_double.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_double.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ type>, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_float.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_float.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mscclRunInterpreter, ProtoSimple, f u134l | l O p s >v(ociodm m*,d satl,g o*,s rwco;r k )| ; ^ \ | = nullptr| ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscIn file included from c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cppl:R1u: n/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hI:n154t:e10r:p rwarning: evariable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]t er, ProtoSimple, ProtoLL, false>' requested hereU NKSTEP S5/ | M S C C L _ S L IMCSECSCTLE_PISM,P LM_SKCECRLN_ESLL_IECNETSRTYE_PFSU>N,C _fDuElVlROEpDsO>P(_cToYmPmE,( Maalxg,o ,r cwcolr_kb)f;l o\a t 1| 6 ^, fals/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.he:)562;: 15 :| ^note: field 'nthreads' will be initialized after field 'tidInBlock' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399: 3562: | note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' tid(tid) ,399 | n t hmrsecacdlsR(unntIhnrteeadrsp)r,e tteird(,g rPourpo)t, o L| L ^~~~~~~~~~~~~~~~~, fu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.hl:l562O:p60s:> (note: cfield 'group' will be initialized after field 'stepSize'o mm, al g562o | , w o rtki)d;( t\i d )| , ^ nth/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hr:e165a:d33s:( nnote: tuninitialized use occurs hereh reads) ,165 | t i d I ncBolpoycTko(Sthhmreme8a(dtIiddx%.WxA)R,P _gSrIoZuEp,( gdrsotu,p )s,r c ,| ^~~~~~~~~~~b ytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterp/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ reter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Max, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Mi 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr n, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h)==3), g:r154o:u10p:(g rwarning: ovariable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized]u p), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | 154 | s tceapsSei z3e:( n c| c ^l Shmem.comm.buffSizes[NCCL_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cppP:R5O:T9O:_ Lnote: Lin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here1 28]/NC C5L | _ S T E P S / s iMzSeCoCfL(_uIiMnPtL6_4K_EtR)N)E L{_ E N| T ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~R Y _| F group(groupU NC_DEVREDOP_/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hT:Y217P:E57(:M inote: nin instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here, int3 2217_ | t , Pfrailmsiet)i;v e s| < ^T , RedOp,/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :F402a:n3A:s ynote: mexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'm etric<1 ,4021 | > , m1s,c cPlrRoutnoI,n t0e>r pprreitmesr < t| y ^p e, Fu/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cppn:c5#:#9d:e vnote: rin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested heree dop , P r o t oMLSLC1C2L8_,I MfPuLl_lKOEpRsN>E(Lc_oEmNmT,R Ya_lFgUoN,C _wDoErVkR)E;D O\P _ T| Y ^P E(Min, i/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hn:t1653:233_:t ,note: uninitialized use occurs heref alse); 165| | ^ c/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.ho:p402y:T3o:S hnote: mexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'e m8(tid %402W | A R Pm_sScIcZlER,u ndIsntt,e rsprrce,t ebry/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h,: 162P:r5o:t owarning: Lvariable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized]L 128 ,162 | f u l l Odpesf>a(uclotm:m , | a ^~~~~~~l go/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h,: 165w:o33r:k )note: ;uninitialized use occurs here \ | ^ 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, p, FanAsymmetric<1,1>, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint8_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uIn file included from int64_t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp):)1 : { /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~154 : 10| : group(group warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h : 217 : 57c:a snote: ein instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 3: | ^217 | Primitives ,note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here1 , Proto ,5 | 0 > p r i m s M S| C ^C L_IMP/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cppL:_5K:E9R:N Enote: Lin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here_ ENTRY _5F | U N C _ D E V R EMDSOCPC_LT_YIPMEP(LM_iKnE,R NuEiLn_tE3N2T_RtY,_ FfUaNlCs_eD)E;V R E| D ^O P_TYPE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h(:M399i:n3,: unote: iexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'n t32_t, f399a | l s em)s;c c l| R ^u nInt/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.he:r402p:r3e:t enote: rexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'< type, F402u | n c #m#sdcecvlrReudnoIpne,t ePrrv(rceodmomp,< taylpgeo>,, wPorrokt)o;L L\1 2 8| , ^ fullOps>(com/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hm:,165 :a33l:g onote: ,uninitialized use occurs here work); \ 165 | | ^ copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint32_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/device_table.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/device_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/device_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/device_table.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/device_table.cpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp%4)==3),: 5g:r9o:u pnote: (in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested hereg roup), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 5 | M510S | C C L _ IsMtPeLp_SKiEzReN(EnLc_cElNSThRmYe_mF.UcNoCm_mD.EbVuRfEfDSOiPz_eTsY[PNEC(CMLi_nP,R OiTnOt_6L4L_1t2,8 ]f/aNlCsCeL)_;S T E| P ^S /sizeof(uint64_t/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h):)399 :{3 : | note: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' | group(group 399 | mscclRunInterpreter/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h<:t217yp:e57,: Fnote: uin instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested heren c##dev r217e | d o pPi,v ePsrs(ycmommemt,r iaclw,o r1k,) ;P r\o t o| , ^ 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h::9165:: 33note: :in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here note: uninitialized use occurs here 5 | 165 | c o pMySTCoCSLh_mIeMmP8L(_tKiEdR%NWEALR_PE_NSTIRZYE_,F UdNsCt_,D EsVrRcE,D ObPy_tTeYsP)E;( M i| n ^~~, int64_t, false); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h :| 162 ^: 5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h: 402162: | 3 : note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'd efault: 402 | | ^~~~~~~ ms/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hc:c165l:R33u:n Inote: nuninitialized use occurs heret erpr e165t | e r < t ycpoep,y TFouSnhcm#e#md8e(vtriedd%oWpAZ,E ,P rdostto,L Ls1r2c8,, bfyutlelsO)p;s > (| c ^~~o mm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, int64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr ]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1030. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, uint64_t, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_double.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_double.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | msIn file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr cclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_double.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, double, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_float.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_float.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recv/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.hP:t386r:(90:) +warning: lvariable 'wireOffset' set but not used [-Wunused-but-set-variable]l 128Offs e386t | ; | ^~~i nt wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, wor/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:k217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here ); \ 217 | | ^ Primitives, 1, Proto, 0 >165 | p r i m sc o p| y ^T oShme/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cppm:85(:t9i:d %note: Win instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested hereA RP_SI Z5E | , d s t , s rMcS,C CbLy_tIeMsP)L;_ K E| R ^~~N EL_ENTRY_FUNC_DE/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.hV:R162E:D5O:P _warning: Tvariable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized]Y PE( M162i | n , f ldoeafta,u lfta:l s e| ) ^~~~~~~; /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h| : ^165 :33/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:: 402note: :uninitialized use occurs here3 : note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 165 | 402c | o p ymTsocSchlmReumn8I(nttiedr%pWrAeRtPe_rS , ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ _STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_float.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, float, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 99%] Building CXX object CMakeFiles/rccl.dir/git_version.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/git_version.cpp.o -MF CMakeFiles/rccl.dir/git_version.cpp.o.d -o CMakeFiles/rccl.dir/git_version.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/git_version.cpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_half.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_half.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, w/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ork); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx900. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx90a. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMin<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_half.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMin<__half>, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, half, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/host_table.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/host_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/host_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/host_table.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/host_table.cpp gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp.o /usr/bin/clang++ -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_UNCACHED_MEMORY -DNVTX_NO_IMPL -DROCM_VERSION=60102 -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/include -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives -I/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device -pipe -frecord-gcc-switches -Wall -g -O2 -std=c++14 -fPIC -parallel-jobs=12 -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -mllvm=-amdgpu-early-inline-all=true -mllvm=-amdgpu-function-calls=false -x hip --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp.o -c /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1030. 15 warnings generated when compiling for gfx940. 15 warnings generated when compiling for gfx1100. 15 warnings generated when compiling for gfx803. 15 warnings generated when compiling for gfx941. 15 warnings generated when compiling for gfx908. 15 warnings generated when compiling for gfx906. 15 warnings generated when compiling for gfx1102. 15 warnings generated when compiling for gfx900. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx1101. 15 warnings generated when compiling for host. 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:168: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:14: warning: unused variable 'data1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:21: warning: unused variable 'flag1' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:28: warning: unused variable 'data2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:153:35: warning: unused variable 'flag2' [-Wunused-variable] 153 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll.h:514:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 514 | int offset = tid; | ^ In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:271:19: warning: unused variable 'ptr' [-Wunused-variable] 271 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:386:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 386 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ 15 warnings generated when compiling for gfx90a. In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:399:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 399 | mscclRunInterpreter, ProtoLL, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:169: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_ll128.h:509:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 507 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 508 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 509 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 510 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:154:10: warning: variable 'dst' is used uninitialized whenever switch case is taken [-Wsometimes-uninitialized] 154 | case 3: | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:162:5: warning: variable 'dst' is used uninitialized whenever switch default is taken [-Wsometimes-uninitialized] 162 | default: | ^~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:165:33: note: uninitialized use occurs here 165 | copyToShmem8(tid%WARP_SIZE, dst, src, bytes); | ^~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:134:14: note: initialize the variable 'dst' to silence this warning 134 | void *dst, *src; | ^ | = nullptr In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:1: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:13: In file included from /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/primitives.h:167: /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) 563 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp:5:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 5 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Min, rccl_bfloat16, false); | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/hipify/src/collectives/device/prims_simple.h:562:60: note: field 'group' will be initialized after field 'stepSize' 562 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for gfx942. gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[2]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [100%] Linking CXX shared library librccl.so /usr/bin/cmake -E cmake_link_script CMakeFiles/rccl.dir/link.txt --verbose=1 /usr/bin/cmake -E time /usr/bin/clang++ -fPIC -pipe -frecord-gcc-switches -Wall -g -O2 -parallel-jobs=16 -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -shared -Wl,-soname,librccl.so.1 -o librccl.so.1.0 CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/all_gather.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/all_reduce.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/all_to_all.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/all_to_allv.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/broadcast.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/device/onerank_reduce.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/gather.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/reduce.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/reduce_scatter.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/scatter.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/sendrecv.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllGather_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Broadcast_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Max.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_Min.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/SendRecv_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_half.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_float.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_double.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Sum_rccl_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_half.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_float.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_double.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Prod_rccl_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_half.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_float.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_double.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Max_rccl_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_half.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_float.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_double.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/msccl_kernel_Min_rccl_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/device_table.cpp.o CMakeFiles/rccl.dir/hipify/src/collectives/device/host_table.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.1.40093 --hip-link --offload-arch=gfx803 --offload-arch=gfx900:xnack- --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx940 --offload-arch=gfx941 --offload-arch=gfx942 --offload-arch=gfx1030 --offload-arch=gfx1100 --offload-arch=gfx1101 --offload-arch=gfx1102 /usr/lib/llvm-rocm/lib64/clang/17/lib/linux/libclang_rt.builtins-x86_64.a -lpthread -lrt -ldl Elapsed time (seconds): 829.701 /usr/bin/cmake -E cmake_symlink_library librccl.so.1.0 librccl.so.1 librccl.so gmake[2]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake[1]: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' [100%] Built target rccl gmake[1]: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' gmake: Entering directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' /usr/bin/cmake -E cmake_progress_start /usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux/CMakeFiles 0 gmake: Leaving directory '/usr/src/RPM/BUILD/rccl-2.18.6/x86_64-alt-linux' + exit 0 Executing(%install): /bin/sh -e /usr/src/tmp/rpm-tmp.94844 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + /bin/chmod -Rf u+rwX -- /usr/src/tmp/rccl-buildroot + : + /bin/rm -rf -- /usr/src/tmp/rccl-buildroot + PATH=/usr/libexec/rpm-build:/usr/src/bin:/usr/bin:/bin:/usr/local/bin:/usr/games + cd rccl-2.18.6 + DESTDIR=/usr/src/tmp/rccl-buildroot + cmake --install x86_64-alt-linux --verbose -- Install configuration: "" -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/librccl.so.1.0 -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/librccl.so.1 -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/librccl.so -- Installing: /usr/src/tmp/rccl-buildroot/usr/include/rccl/rccl.h -- Installing: /usr/src/tmp/rccl-buildroot/usr/include/rccl/nccl_net.h -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-8n-0-1kb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-8n-1kb-4kb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-8n-1mb-4mb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-8n-4kb-8kb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-8n-4mb-16mb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-8n-8kb-1mb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allgather-allpairs-16n-16tb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allreduce-allpairs-16n-16tb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allreduce-allpairs-16n-32tb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-1pass.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/alltoall-8n-0-1kb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/alltoall-8n-1kb-4kb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/alltoall-8n-1mb-4mb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/alltoall-8n-4kb-8kb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/alltoall-8n-4mb-16mb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-algorithms/alltoall-8n-8kb-1mb.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-unit-test-algorithms -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll128.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-simple.xml -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/cmake/rccl/rccl-targets.cmake -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/cmake/rccl/rccl-targets-noconfig.cmake -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/cmake/rccl/rccl-config.cmake -- Installing: /usr/src/tmp/rccl-buildroot/usr/lib64/cmake/rccl/rccl-config-version.cmake -- Installing: /usr/src/tmp/rccl-buildroot/usr/share/doc/rccl/LICENSE.txt + rm -rf /usr/src/tmp/rccl-buildroot/usr/rccl + rm -rf /usr/src/tmp/rccl-buildroot/usr/share/doc/rccl + /usr/lib/rpm/brp-alt Cleaning files in /usr/src/tmp/rccl-buildroot (auto) mode of './usr/lib64/librccl.so.1.0' changed from 0755 (rwxr-xr-x) to 0644 (rw-r--r--) Verifying and fixing files in /usr/src/tmp/rccl-buildroot (binconfig,pkgconfig,libtool,desktop,gnuconfig) Checking contents of files in /usr/src/tmp/rccl-buildroot/ (default) Compressing files in /usr/src/tmp/rccl-buildroot (auto) Adjusting library links in /usr/src/tmp/rccl-buildroot ./usr/lib64: (from :0) librccl.so.1 -> librccl.so.1.0 Verifying ELF objects in /usr/src/tmp/rccl-buildroot (arch=normal,fhs=normal,lfs=relaxed,lint=relaxed,rpath=normal,stack=normal,textrel=normal,unresolved=normal) section [ 3] '.dynsym': symbol 338 (__hip_fatbin): symbol in dynamic symbol table with non-default visibility verify-elf: WARNING: ./usr/lib64/librccl.so.1.0: eu-elflint failed Splitting links to aliased files under /{,s}bin in /usr/src/tmp/rccl-buildroot Processing files: librccl1-2.18.6-alt0.1 Executing(%doc): /bin/sh -e /usr/src/tmp/rpm-tmp.44779 + umask 022 + /bin/mkdir -p /usr/src/RPM/BUILD + cd /usr/src/RPM/BUILD + cd rccl-2.18.6 + DOCDIR=/usr/src/tmp/rccl-buildroot/usr/share/doc/librccl1-2.18.6 + export DOCDIR + rm -rf /usr/src/tmp/rccl-buildroot/usr/share/doc/librccl1-2.18.6 + /bin/mkdir -p /usr/src/tmp/rccl-buildroot/usr/share/doc/librccl1-2.18.6 + cp -prL README.md LICENSE.txt NOTICES.txt CHANGELOG.md /usr/src/tmp/rccl-buildroot/usr/share/doc/librccl1-2.18.6 + chmod -R go-w /usr/src/tmp/rccl-buildroot/usr/share/doc/librccl1-2.18.6 + chmod -R a+rX /usr/src/tmp/rccl-buildroot/usr/share/doc/librccl1-2.18.6 + exit 0 Finding Provides (using /usr/lib/rpm/find-provides) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.boXTKL find-provides: running scripts (alternatives,debuginfo,lib,pam,perl,pkgconfig,python,python3,shell) lib.prov: /usr/src/tmp/rccl-buildroot/usr/lib64/librccl.so.1: 192 symbols, 18 bpp Finding Requires (using /usr/lib/rpm/find-requires) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.rol7c6 find-requires: running scripts (cpp,debuginfo,files,lib,pam,perl,pkgconfig,pkgconfiglib,python,python3,rpmlib,shebang,shell,static,symlinks,systemd-services) warning: librccl1 provides another subpackage: rccl Provides: rccl = 2.18.6-alt0.1, librccl.so.1()(64bit) = set:ldySY8WxOALBnhFpKYr8hTuOp4f4mGu2jLdMJjcZCXM47UXuwyyGRGWXKgETcgdjMi5wuDQ3qOxtZBm81J7pYPMIUZa5VdctQkKefUrjndPqhuFfak8KACxDBZ2WZJDfvJzZ89VmVuIkNiinUuRvWX09AlpiViW0mDiqb8i3YJossrximfgU5FDIg3bfAM3p87RAKcG4MZinBzsSGNgsBCROo9k0v79172vNT21EO938Mcw8TzCb018bhHvvzgmTvhhNQWFQoI4SSRedfYZyMcS4HABqmacW4xzCUZaO5x9LSUxVFl0qy5C7FFGgAn04Hyxww4hPwz6LsL4UDEnEe2dpGZx29zB56rIHYGcZG1BqjQafIX1WE3sbDhXCpfBjMq4 Requires: ld-linux-x86-64.so.2()(64bit) >= set:jiids, ld-linux-x86-64.so.2(GLIBC_2.3)(64bit), libamdhip64.so.6()(64bit) >= set:mgEl4iHah5shPP2z5A5zYttYI7XpZyRnhe1J6ZgwULwPlWeYZ4XbZd2bItRMqeW4hZmmUYmDZdpDnrYqkUKOuzfUwKzIyQItN97gggSsa6v6KYBa3m70aJ49gh1ckMQcuEPMZKgWZw, libamdhip64.so.6(hip_4.2)(64bit), libamdhip64.so.6(hip_4.3)(64bit), libamdhip64.so.6(hip_4.5)(64bit), libamdhip64.so.6(hip_5.0)(64bit), libamdhip64.so.6(hip_5.3)(64bit), libamdhip64.so.6(hip_6.0)(64bit), libc.so.6(GLIBC_2.14)(64bit), libc.so.6(GLIBC_2.17)(64bit), libc.so.6(GLIBC_2.2.5)(64bit), libc.so.6(GLIBC_2.3)(64bit), libc.so.6(GLIBC_2.3.2)(64bit), libc.so.6(GLIBC_2.3.4)(64bit), libc.so.6(GLIBC_2.33)(64bit), libc.so.6(GLIBC_2.34)(64bit), libc.so.6(GLIBC_2.38)(64bit), libc.so.6(GLIBC_2.6)(64bit), libgcc_s.so.1(GCC_3.0)(64bit), libm.so.6(GLIBC_2.2.5)(64bit), librocm_smi64.so.1()(64bit) >= set:miSwa9ZECgdMsH9hGiyEU5mNQ1, libstdc++.so.6(CXXABI_1.3)(64bit), libstdc++.so.6(CXXABI_1.3.5)(64bit), libstdc++.so.6(CXXABI_1.3.7)(64bit), libstdc++.so.6(GLIBCXX_3.4)(64bit), libstdc++.so.6(GLIBCXX_3.4.11)(64bit), libstdc++.so.6(GLIBCXX_3.4.18)(64bit), libstdc++.so.6(GLIBCXX_3.4.19)(64bit), libstdc++.so.6(GLIBCXX_3.4.21)(64bit), libstdc++.so.6(GLIBCXX_3.4.22)(64bit), libstdc++.so.6(GLIBCXX_3.4.29)(64bit), rtld(GNU_HASH) Requires(rpmlib): rpmlib(SetVersions) Finding debuginfo files (using /usr/lib/rpm/find-debuginfo-files) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.UfkSLO Creating librccl1-debuginfo package Processing files: librccl-devel-2.18.6-alt0.1 Finding Provides (using /usr/lib/rpm/find-provides) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.ortCY5 find-provides: running scripts (alternatives,debuginfo,lib,pam,perl,pkgconfig,python,python3,shell) Finding Requires (using /usr/lib/rpm/find-requires) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.hZlR3r find-requires: running scripts (cpp,debuginfo,files,lib,pam,perl,pkgconfig,pkgconfiglib,python,python3,rpmlib,shebang,shell,static,symlinks,systemd-services) In file included from /usr/src/tmp/rccl-buildroot/usr/include/rccl/rccl.h:12: /usr/include/hip/hip_runtime.h:66:2: error: #error ("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); 66 | #error("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); | ^~~~~ In file included from /usr/include/hip/hip_runtime.h:70: /usr/include/hip/hip_runtime_api.h:8852:2: error: #error ("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); 8852 | #error("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); | ^~~~~ In file included from /usr/include/hip/hip_runtime.h:71: /usr/include/hip/library_types.h:75:2: error: #error ("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); 75 | #error("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); | ^~~~~ In file included from /usr/include/hip/hip_runtime.h:73: /usr/include/hip/hip_vector_types.h:38:2: error: #error ("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); 38 | #error("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); | ^~~~~ In file included from /usr/src/tmp/rccl-buildroot/usr/include/rccl/rccl.h:13: /usr/include/hip/hip_fp16.h:33:2: error: #error ("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); 33 | #error("Must define exactly one of __HIP_PLATFORM_AMD__ or __HIP_PLATFORM_NVIDIA__"); | ^~~~~ cpp.req: /usr/src/tmp/rccl-buildroot/usr/include/rccl/rccl.h: cpp failed, trying c++ mode x86_64-alt-linux-cpp: fatal error: cannot execute 'cc1plus': execvp: No such file or directory compilation terminated. cpp.req: WARNING: /usr/src/tmp/rccl-buildroot/usr/include/rccl/rccl.h: cpp failed /usr/src/tmp/rccl-buildroot/usr/include/rccl/nccl_net.h:10:10: fatal error: nccl.h: No such file or directory 10 | #include "nccl.h" | ^~~~~~~~ compilation terminated. cpp.req: WARNING: /usr/src/tmp/rccl-buildroot/usr/include/rccl/nccl_net.h: cpp failed Provides: rccl-devel = 2.18.6-alt0.1 Requires: /usr/lib64/librccl.so.1 Finding debuginfo files (using /usr/lib/rpm/find-debuginfo-files) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.tEPSSh Processing files: librccl1-debuginfo-2.18.6-alt0.1 Finding Provides (using /usr/lib/rpm/find-provides) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.8oxlti find-provides: running scripts (debuginfo) Finding Requires (using /usr/lib/rpm/find-requires) Executing: /bin/sh -e /usr/src/tmp/rpm-tmp.pIcLnw find-requires: running scripts (debuginfo) Provides: debug64(librccl.so.1) Requires: librccl1 = 2.18.6-alt0.1, debug64(ld-linux-x86-64.so.2), debug64(libamdhip64.so.6), debug64(libc.so.6), debug64(libgcc_s.so.1), debug64(libm.so.6), debug64(librocm_smi64.so.1), debug64(libstdc++.so.6) Adding to librccl1-debuginfo a strict dependency on librccl1 Adding to librccl-devel a strict dependency on librccl1 Removing 1 extra deps from librccl-devel due to dependency on librccl1 Wrote: /usr/src/RPM/RPMS/x86_64/librccl1-2.18.6-alt0.1.x86_64.rpm (w2T8.xzdio) Wrote: /usr/src/RPM/RPMS/x86_64/librccl-devel-2.18.6-alt0.1.x86_64.rpm (w2T8.xzdio) Wrote: /usr/src/RPM/RPMS/x86_64/librccl1-debuginfo-2.18.6-alt0.1.x86_64.rpm (w2.lzdio) 19965.54user 515.08system 44:41.55elapsed 763%CPU (0avgtext+0avgdata 5539576maxresident)k 50952inputs+0outputs (79major+82958292minor)pagefaults 0swaps /.out/librccl1-2.18.6-alt0.1.x86_64.rpm: bad symbols in the license tag: // /.out/librccl-devel-2.18.6-alt0.1.x86_64.rpm: bad symbols in the license tag: // /.out/librccl1-debuginfo-2.18.6-alt0.1.x86_64.rpm: bad symbols in the license tag: // 11.82user 3.62system 47:51.16elapsed 0%CPU (0avgtext+0avgdata 136020maxresident)k 1894712inputs+0outputs (0major+314577minor)pagefaults 0swaps --- librccl1-2.18.6-alt0.1.x86_64.rpm.repo 2024-08-13 08:56:51.000000000 +0000 +++ librccl1-2.18.6-alt0.1.x86_64.rpm.hasher 2024-09-07 00:49:36.646216730 +0000 @@ -46,3 +46,3 @@ File: /usr/lib64/librccl.so.1 120777 root:root librccl.so.1.0 -File: /usr/lib64/librccl.so.1.0 100644 root:root 2e5c3ab2b95eede8c321abb70ecf8073 +File: /usr/lib64/librccl.so.1.0 100644 root:root 86d8f01d32ab1266e2b61948dc29ae2b File: /usr/share/doc/librccl1-2.18.6 40755 root:root @@ -52,2 +52,2 @@ File: /usr/share/doc/librccl1-2.18.6/README.md 100644 root:root 7f63560222074951adb129e12c2ea047 -RPMIdentity: e713b9c77db3c8749c70a5cd7ad4ea3e27866bc78e36d700dc50200eab38283472282f7d4b17396a7025a778ee2ab574f956b3a1db80316db878d3e5f095ae6d +RPMIdentity: 027643801ba16e8849a51668920b4c9b2300569ec06de51aa662027fd96c699702c5b7d7791898de3593390cce35ceeabc4a6c23d2df0c60a74dedea4f662c44 --- librccl1-debuginfo-2.18.6-alt0.1.x86_64.rpm.repo 2024-08-13 08:56:50.000000000 +0000 +++ librccl1-debuginfo-2.18.6-alt0.1.x86_64.rpm.hasher 2024-09-07 00:49:36.724216890 +0000 @@ -1,4 +1,4 @@ -/usr/lib/debug/.build-id/06 40755 root:root -/usr/lib/debug/.build-id/06/e0e74b54f4c9a58ada6b6594323d08d8b96adb 120777 root:root ../../../../lib64/librccl.so.1.0 -/usr/lib/debug/.build-id/06/e0e74b54f4c9a58ada6b6594323d08d8b96adb.debug 120777 root:root ../../usr/lib64/librccl.so.1.0.debug +/usr/lib/debug/.build-id/90 40755 root:root +/usr/lib/debug/.build-id/90/505a914e78ab44502ae1d1e927623326d7e266 120777 root:root ../../../../lib64/librccl.so.1.0 +/usr/lib/debug/.build-id/90/505a914e78ab44502ae1d1e927623326d7e266.debug 120777 root:root ../../usr/lib64/librccl.so.1.0.debug /usr/lib/debug/usr/lib64/librccl.so.1.0.debug 100644 root:root @@ -300,6 +300,6 @@ Provides: librccl1-debuginfo = 2.18.6-alt0.1:sisyphus+353658.300.4.1 -File: /usr/lib/debug/.build-id/06 40755 root:root -File: /usr/lib/debug/.build-id/06/e0e74b54f4c9a58ada6b6594323d08d8b96adb 120777 root:root ../../../../lib64/librccl.so.1.0 -File: /usr/lib/debug/.build-id/06/e0e74b54f4c9a58ada6b6594323d08d8b96adb.debug 120777 root:root ../../usr/lib64/librccl.so.1.0.debug -File: /usr/lib/debug/usr/lib64/librccl.so.1.0.debug 100644 root:root f8eef68f4c9d90c9baa5adae3fa5e884 +File: /usr/lib/debug/.build-id/90 40755 root:root +File: /usr/lib/debug/.build-id/90/505a914e78ab44502ae1d1e927623326d7e266 120777 root:root ../../../../lib64/librccl.so.1.0 +File: /usr/lib/debug/.build-id/90/505a914e78ab44502ae1d1e927623326d7e266.debug 120777 root:root ../../usr/lib64/librccl.so.1.0.debug +File: /usr/lib/debug/usr/lib64/librccl.so.1.0.debug 100644 root:root e6d1140ed4f1dec79d9562080a23ec9e File: /usr/lib/debug/usr/lib64/librccl.so.1.debug 120777 root:root librccl.so.1.0.debug @@ -589,2 +589,2 @@ File: /usr/src/debug/rccl-2.18.6/x86_64-alt-linux/include/nccl.h 100644 root:root 88c99b744f34dbc0b9c2f53fd9431572 -RPMIdentity: 29d02fa69e031265be273d534b520a374d6107348fa62b1cdfa2b723d006c08d734c8e9950fc8dc604603c646100fa1259f3fc5a5cb1d982dd16a747e0d1d189 +RPMIdentity: 8cc88d71ca996b3f09251fe56bb594d620a11baf49fecdf1fd468f9eaccd6f228113750307d5bd3f6fd6123fa8e2bdf29e79062b88211067b79e15f4b5b1ccd0